ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 366
Committed: Sun Sep 25 13:38:38 2016 UTC (8 years, 2 months ago) by matthys
File size: 158470 byte(s)
Log Message:
Added LinkedIn + Pinterest detection + icons

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 matthys 355 * Copyright (C) 2001-2016, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192.comAgent" => ""
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array(
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www.ackerm.com" => ""
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293     "^NutchEC2Test" => ""
294     ),
295     "uri" => "http://www.amazon.com/"
296     ),
297     "amidalla" => array(
298     "icon" => "amidalla",
299     "title" => "Amidalla",
300     "rule" => array(
301     "^amibot" => ""
302     ),
303     "uri" => ""
304     ),
305     "amfibi" => array(
306     "icon" => "amfibi",
307     "title" => "Amfibi",
308     "rule" => array(
309     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310     "Amfibibot" => ""
311     ),
312     "uri" => ""
313     ),
314     "amphetadesk" => array(
315     "icon" => "robot",
316     "title" => "AmphetaDesk",
317     "rule" => array(
318     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319     ),
320     "uri" => ""
321     ),
322     "amphetameme" => array(
323     "icon" => "robot",
324     "title" => "Amphetameme",
325     "rule" => array(
326     "amphetameme[ \-]?crawler" => ""
327     ),
328     "uri" => ""
329     ),
330     "annomille" => array(
331     "icon" => "robot",
332     "title" => "AnnoMille",
333     "rule" => array(
334     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335     ),
336     "uri" => "http://www.annomille.it"
337     ),
338     "anonymouse" => array(
339     "icon" => "anonymouse",
340     "title" => "Anonymouse.org",
341     "rule" => array(
342     "http://Anonymouse.org" => ""
343     ),
344     "uri" => "http://anonymouse.org"
345     ),
346     "ansearch" => array(
347     "icon" => "robot",
348     "title" => "Ansearch",
349     "rule" => array(
350     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351     ),
352     "uri" => ""
353     ),
354     "answerchase" => array(
355     "icon" => "answerchase",
356     "title" => "AnswerChase",
357     "rule" => array(
358     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359     ),
360     "uri" => "http://www.answerchase.com/"
361     ),
362     "antibot" => array(
363     "icon" => "robot",
364 matthys 205 "title" => "Antibot",
365 joku 63 "rule" => array(
366     "antibot-V([0-9.]{1,10})" => "\\1"
367     ),
368     "uri" => ""
369     ),
370     "aonde" => array(
371     "icon" => "aonde",
372     "title" => "Aonde",
373     "rule" => array(
374     "^AONDE-Spider" => ""
375     ),
376     "uri" => ""
377     ),
378     "aonline" => array(
379     "icon" => "robot",
380     "title" => "A-Online.at",
381     "rule" => array(
382     "^A-Online Search" => ""
383     ),
384     "uri" => "http://www.a-online.at/"
385     ),
386     "aol" => array(
387     "icon" => "aol",
388     "title" => "AOLserver",
389     "rule" => array(
390     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391     "^AOLserver" => ""
392     ),
393     "uri" => ""
394     ),
395     "apachebench" => array(
396     "icon" => "robot",
397     "title" => "ApacheBench",
398     "rule" => array(
399     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => ""
402     ),
403     "apassion4jazz" => array(
404     "icon" => "robot",
405     "title" => "Passion 4 Jazz",
406     "rule" => array(
407     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410     ),
411     "apexoo" => array(
412     "icon" => "robot",
413     "title" => "Apexoo",
414     "rule" => array(
415     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apexoo.com/"
418     ),
419     "apnoti" => array(
420     "icon" => "apnoti",
421 matthys 205 "title" => "Apnoti",
422 joku 63 "rule" => array(
423     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424     ),
425     "uri" => "http://www.apnoti.com/"
426     ),
427     "aport" => array(
428     "icon" => "aport",
429     "title" => "Aport",
430     "rule" => array(
431     "^Aport" => ""
432     ),
433     "uri" => ""
434     ),
435     "appie" => array(
436     "icon" => "walhello",
437     "title" => "Walhello",
438     "rule" => array(
439     "appie[ /]([0-9.]{1,10})" => "\\1"
440     ),
441     "uri" => ""
442     ),
443     "arachmo" => array(
444     "icon" => "arachmo",
445     "title" => "Arachmo",
446     "rule" => array(
447     "compatible; Arachmo" => ""
448     ),
449     "uri" => ""
450     ),
451     "arexera" => array(
452     "icon" => "arexera",
453     "title" => "Arexera",
454     "rule" => array(
455     "^X-Crawler" => "",
456     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
457     ),
458     "uri" => "http://www.arexera.de/"
459     ),
460     "arianna" => array(
461     "icon" => "arianna",
462     "title" => "Arianna",
463     "rule" => array(
464     "^www.arianna.it" => ""
465     ),
466     "uri" => "http://www.arianna.it/"
467     ),
468     "artface" => array(
469     "icon" => "robot",
470     "title" => "Artface",
471     "rule" => array(
472     "^ArtfaceBot" => ""
473     ),
474     "uri" => ""
475     ),
476     "artviper" => array(
477     "icon" => "artviper",
478     "title" => "artViper",
479     "rule" => array(
480     "artViper" => ""
481     ),
482     "uri" => "http://www.artviper.net/"
483     ),
484     "asinfo" => array(
485     "icon" => "robot",
486     "title" => "Any Search Info",
487     "rule" => array(
488     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
489     ),
490     "uri" => "http://search-info.com/"
491     ),
492     "ask" => array(
493     "icon" => "askjeeves",
494     "title" => "Ask Jeeves",
495     "rule" => array(
496     "Ask[ \-]?Jeeves" => "",
497     "teomaagent" => ""
498     ),
499     "uri" => ""
500     ),
501     "askaboutoil" => array(
502     "icon" => "robot",
503     "title" => "AskAboutOil", // label follows this entry's key and rule; "ASPseek" is the separate aspseek entry
504     "rule" => array(
505     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
506     ),
507     "uri" => "http://askaboutoil.com/"
508     ),
509     "asked" => array(
510     "icon" => "robot",
511 matthys 205 "title" => "AskEd!",
512 joku 63 "rule" => array(
513     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
514     ),
515     "uri" => "http://asked.jp"
516     ),
517     "aspseek" => array(
518     "icon" => "robot",
519     "title" => "ASPseek",
520     "rule" => array(
521     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
522     ),
523     "uri" => ""
524     ),
525     "atlocal" => array(
526     "icon" => "robot",
527     "title" => "At Local",
528     "rule" => array(
529     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
530     ),
531     "uri" => "http://www.atlocal.com/"
532     ),
533     "atomz" => array(
534     "icon" => "atomz",
535     "title" => "Atomz",
536     "rule" => array(
537     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
538     ),
539     "uri" => ""
540     ),
541 matthys 345 "avira" => array(
542     "icon" => "avira",
543     "title" => "Avira SafeSearch",
544     "rule" => array(
545     "^SafeSearch microdata crawler" => ""
546     ),
547     "uri" => "https://safesearch.avira.com"
548     ),
549 joku 63 "axel" => array(
550     "icon" => "robot",
551     "title" => "Axel",
552     "rule" => array(
553     "^axel" => ""
554     ),
555     "uri" => ""
556     ),
557     "axmo" => array(
558     "icon" => "axmo",
559     "title" => "Axmo",
560     "rule" => array(
561     "AxmoRobot" => ""
562     ),
563     "uri" => ""
564     ),
565     "answerbus" => array(
566     "icon" => "answerbus",
567     "title" => "AnswerBus",
568     "rule" => array(
569     "answerbus" => ""
570     ),
571     "uri" => ""
572     ),
573     "automapit" => array(
574     "icon" => "robot",
575     "title" => "AutoMapIt",
576     "rule" => array(
577     "AutoMapIt[ /](Bot)?" => ""
578     ),
579     "uri" => "http://www.automapit.com/bot.html"
580     ),
581     "augurnfind" => array(
582     "icon" => "robot",
583     "title" => "Augurnfind",
584     "rule" => array(
585     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
586     ),
587     "uri" => ""
588     ),
589     "awasu" => array(
590     "icon" => "awasu",
591     "title" => "Awasu",
592     "rule" => array(
593     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
594     ),
595     "uri" => ""
596     ),
597     "axxus" => array(
598     "icon" => "axxus",
599     "title" => "axxus.de",
600     "rule" => array(
601     "whoiam" => ""
602     ),
603     "uri" => "http://www.axxus.de/"
604     ),
605     "ayell" => array(
606     "icon" => "ayell",
607     "title" => "Ayell",
608     "rule" => array(
609     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
610     ),
611     "uri" => "http://eurobot.ayell.eu"
612     ),
613     "babaloo" => array(
614     "icon" => "babaloo",
615     "title" => "Babaloo",
616     "rule" => array(
617     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
618     ),
619     "uri" => "http://www.babaloo.si"
620     ),
621     "babe" => array(
622     "icon" => "robot",
623     "title" => "ba.be",
624     "rule" => array(
625     "BACS http://www.ba.be" => ""
626     ),
627     "uri" => "http://www.ba.be/"
628     ),
629     "baidu" => array(
630     "icon" => "baidu",
631     "title" => "Baidu",
632     "rule" => array(
633     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
634     "Baiduspider" => ""
635     ),
636     "uri" => "http://www.baidu.com/search/spider.html"
637     ),
638     "bananatree" => array(
639     "icon" => "robot",
640     "title" => "BananaTree",
641     "rule" => array(
642     "www\.thebananatree\.org" => ""
643     ),
644     "uri" => "http://www.thebananatree.org/"
645     ),
646     "bdcindexer" => array(
647     "icon" => "robot",
648     "title" => "bdcindexer",
649     "rule" => array(
650     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
651     ),
652     "uri" => "http://www.business.com/"
653     ),
654     "bdfetch" => array(
655     "icon" => "robot",
656     "title" => "BDFetch",
657     "rule" => array(
658     "^BDFetch" => ""
659     ),
660     "uri" => ""
661     ),
662     "bdncentral" => array(
663     "icon" => "robot",
664     "title" => "Bdncentral",
665     "rule" => array(
666     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
667     ),
668     "uri" => "http://www.bdncentral.com/robot.html"
669     ),
670     "beammachine" => array(
671     "icon" => "robot",
672     "title" => "BeamMachine",
673     "rule" => array(
674     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
675     ),
676     "uri" => "http://www.beammachine.net/"
677     ),
678     "become" => array(
679     "icon" => "become",
680     "title" => "Become",
681     "rule" => array(
682     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
683     "(BecomeBot|Exabot)@exava\.com\)$" => ""
684     ),
685     "uri" => "http://www.become.com/"
686     ),
687     "beebware" => array(
688     "icon" => "robot",
689     "title" => "Beebware",
690     "rule" => array(
691     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the pattern has a single capture group (the version), so the back-reference is \1
692     ),
693     "uri" => ""
694     ),
695     "bigbrother" => array(
696     "icon" => "robot",
697     "title" => "Big Brother",
698     "rule" => array(
699     "^Big Brother" => ""
700     ),
701     "uri" => "http://pauillac.inria.fr/~fpottier/"
702     ),
703     "bigclique" => array(
704     "icon" => "robot",
705     "title" => "BigClique",
706     "rule" => array(
707     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
708     ),
709     "uri" => "http://www.bigclique.com"
710     ),
711     "biglotron" => array(
712     "icon" => "robot",
713     "title" => "Biglotron",
714     "rule" => array(
715     "^BIGLOTRON" => ""
716     ),
717     "uri" => "http://www.bigclique.com"
718     ),
719     "bigsearch" => array(
720     "icon" => "bigsearch",
721     "title" => "Bigsearch",
722     "rule" => array(
723     "Bigsearch.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1"
724     ),
725     "uri" => ""
726     ),
727     "bilbo" => array(
728     "icon" => "robot",
729     "title" => "Bilbo",
730     "rule" => array(
731     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
732     ),
733     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
734     ),
735     "bilgi" => array(
736     "icon" => "bilgi",
737     "title" => "Bilgi",
738     "rule" => array(
739     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" tag; the version number is group 2
740     ),
741     "uri" => "http://www.bilgi.com/"
742     ),
743     "bitacle" => array(
744     "icon" => "bitacle",
745     "title" => "Bitacle",
746     "rule" => array(
747     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
748     ),
749     "uri" => "http://bitacle.org/"
750     ),
751     "bitbeamer" => array(
752     "icon" => "bitbeamer",
753     "title" => "BitBeamer",
754     "rule" => array(
755     "BitBeamer/([0-9.]{1,10})" => "\\1"
756     ),
757     "uri" => ""
758     ),
759     "biz360" => array(
760     "icon" => "biz360",
761     "title" => "Biz360",
762     "rule" => array(
763     "^Biz360 spider" => ""
764     ),
765     "uri" => ""
766     ),
767     "backlinktest" => array(
768     "icon" => "backlinktest",
769     "title" => "BacklinkCrawler",
770     "rule" => array(
771     "BacklinkCrawler" => ""
772     ),
773     "uri" => "http://www.backlinktest.com/crawler.html"
774     ),
775     "blaizbee" => array(
776     "icon" => "blaiz-bee",
777     "title" => "Blaiz-Bee",
778     "rule" => array(
779     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // use the captured version number, as the other versioned rules do
780     ),
781     "uri" => ""
782     ),
783     "blogbeat" => array(
784     "icon" => "robot",
785     "title" => "BlogBeat",
786     "rule" => array(
787     "BlogBeat/?([0-9.]{1,10})" => "\\1",
788     ),
789     "uri" => "http://www.blogbeat.nl"
790     ),
791     "blogbotde" => array(
792     "icon" => "robot",
793     "title" => "blogbot.de",
794     "rule" => array(
795     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
796     ),
797     "uri" => "http://blogbot.de/"
798     ),
799     "blogcensus" => array(
800     "icon" => "blogcensus",
801     "title" => "Blogcensus",
802     "rule" => array(
803     "^Blogcensus" => "",
804     ),
805     "uri" => "http://blogcensus.de/bot/"
806     ),
807     "blogdex" => array(
808     "icon" => "robot",
809     "title" => "Blogdex",
810     "rule" => array(
811     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
812     ),
813     "uri" => ""
814     ),
815     "blogg" => array(
816     "icon" => "blogg",
817     "title" => "Blogg",
818     "rule" => array(
819     "^blogg\.de" => ""
820     ),
821     "uri" => ""
822     ),
823     "blogland" => array(
824     "icon" => "robot",
825     "title" => "BlogLand",
826     "rule" => array(
827     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
828     ),
829     "uri" => ""
830     ),
831     "bloglines" => array(
832     "icon" => "bloglines",
833     "title" => "Bloglines",
834     "rule" => array(
835     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
836     "Bloglines" => ""
837     ),
838     "uri" => ""
839     ),
840     "blogmap" => array(
841     "icon" => "robot",
842     "title" => "Blogmap",
843     "rule" => array(
844     "blogmap" => ""
845     ),
846     "uri" => ""
847     ),
848     "blogosphere" => array(
849     "icon" => "robot",
850     "title" => "Blogosphere",
851     "rule" => array(
852     "Blogosphere" => ""
853     ),
854     "uri" => ""
855     ),
856     "blogpeople" => array(
857     "icon" => "robot",
858     "title" => "BlogPeople",
859     "rule" => array(
860     "BlogPeople" => ""
861     ),
862     "uri" => ""
863     ),
864     "blogpulse" => array(
865     "icon" => "blogpulse",
866     "title" => "Blogpulse",
867     "rule" => array(
868     "Blogpulse" => ""
869     ),
870     "uri" => ""
871     ),
872     "blogranking" => array(
873     "icon" => "blogranking",
874     "title" => "BlogRanking",
875     "rule" => array(
876     "^BlogRanking(/RSS checker)?" => ""
877     ),
878     "uri" => ""
879     ),
880     "blogs" => array(
881     "icon" => "blogs",
882     "title" => "Blo.gs",
883     "rule" => array(
884     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
885     "blo\.gs" => ""
886     ),
887     "uri" => ""
888     ),
889     "blogshares" => array(
890     "icon" => "blogshares",
891     "title" => "BlogShares",
892     "rule" => array(
893     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
894     "(^| |\()Blogshares(\.com| |\))" => ""
895     ),
896     "uri" => ""
897     ),
898     "blogslife" => array(
899     "icon" => "robot",
900     "title" => "BlogsLife",
901     "rule" => array(
902     "Blogslive" => ""
903     ),
904     "uri" => ""
905     ),
906     "blogsnow" => array(
907     "icon" => "blogsnow",
908     "title" => "BlogsNow",
909     "rule" => array(
910     "blogsnowbot" => "",
911     "BlogsNow" => ""
912     ),
913     "uri" => ""
914     ),
915     "blogstreet" => array(
916     "icon" => "blogstreet",
917     "title" => "BlogStreet",
918     "rule" => array(
919     "^BlogStreetBot" => ""
920     ),
921     "uri" => ""
922     ),
923     "blogsurf" => array(
924     "icon" => "robot",
925     "title" => "BlogSurf",
926     "rule" => array(
927     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
928     ),
929     "uri" => ""
930     ),
931     "blogtick" => array(
932     "icon" => "robot",
933     "title" => "BlogTick",
934     "rule" => array(
935     "BlogTickServer" => ""
936     ),
937     "uri" => ""
938     ),
939     "blogwatcher" => array(
940     "icon" => "blogwatcher",
941     "title" => "Blogwatcher",
942     "rule" => array(
943     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
944     ),
945     "uri" => ""
946     ),
947     "blogwise" => array(
948     "icon" => "blogwise",
949     "title" => "Blogwise",
950     "rule" => array(
951     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
952     ),
953     "uri" => ""
954     ),
955     "boardreader" => array(
956     "icon" => "boardreader",
957     "title" => "BoardReader",
958     "rule" => array(
959     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
960     ),
961     "uri" => "http://www.boardreader.com"
962     ),
963     "bobby" => array(
964     "icon" => "bobby",
965     "title" => "Bobby",
966     "rule" => array(
967     "bobby[ /]([0-9.]{1,10})" => "\\1"
968     ),
969     "uri" => ""
970     ),
971     "boitho" => array(
972     "icon" => "robot",
973     "title" => "Boitho",
974     "rule" => array(
975     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
976     ),
977     "uri" => ""
978     ),
979     "booch" => array(
980     "icon" => "robot",
981     "title" => "Booch",
982     "rule" => array(
983     "^booch[_ /]([0-9.]{1,10})" => "\\1"
984     ),
985     "uri" => ""
986     ),
987     "book" => array(
988     "icon" => "book",
989     "title" => "Bookmark",
990     "rule" => array(
991     "http://www\.bookmark\.ne\.jp" => ""
992     ),
993     "uri" => ""
994     ),
995     "bookdog" => array(
996     "icon" => "bookdog",
997     "title" => "Bookdog",
998     "rule" => array(
999     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1000     ),
1001     "uri" => ""
1002     ),
1003     "bordermanager" => array(
1004     "icon" => "bordermanager",
1005     "title" => "Border Manager",
1006     "rule" => array(
1007     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1008     ),
1009     "uri" => ""
1010     ),
1011     "botonparade" => array(
1012     "icon" => "botonparade",
1013     "title" => "Bot on Parade",
1014     "rule" => array(
1015     "BotOnParade" => ""
1016     ),
1017     "uri" => "http://www.bots-on-para.de/bot.html"
1018     ),
1019     "botje" => array(
1020     "icon" => "botje",
1021     "title" => "Botje",
1022     "rule" => array(
1023     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1024     ),
1025     "uri" => "http://www.botje.com/"
1026     ),
1027     "bottomfeeder" => array(
1028     "icon" => "bottomfeeder",
1029     "title" => "BottomFeeder",
1030     "rule" => array(
1031     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1032     ),
1033     "uri" => ""
1034     ),
1035     "browseremulator" => array(
1036     "icon" => "browseremulator",
1037     "title" => "BrowserEmulator",
1038     "rule" => array(
1039     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1040     ),
1041     "uri" => "http://www.dejavu.org/emulator.htm"
1042     ),
1043     "browsershots" => array(
1044     "icon" => "browsershots",
1045     "title" => "Browsershots",
1046     "rule" => array(
1047     "Browsershots URL Check" => ""
1048     ),
1049     "uri" => "http://browsershots.org"
1050     ),
1051     "browserspy" => array(
1052     "icon" => "robot",
1053     "title" => "BrowserSpy",
1054     "rule" => array(
1055     "BrowserSpy" => ""
1056     ),
1057     "uri" => ""
1058     ),
1059     "bruinbot" => array(
1060     "icon" => "robot",
1061     "title" => "BruinBot",
1062     "rule" => array(
1063     "BruinBot" => ""
1064     ),
1065     "uri" => ""
1066     ),
1067     "bruno" => array(
1068     "icon" => "robot",
1069     "title" => "Bruno",
1070     "rule" => array(
1071     "^Bruno" => ""
1072     ),
1073     "uri" => ""
1074     ),
1075     "btbot" => array(
1076     "icon" => "btbot",
1077     "title" => "BitTorrent",
1078     "rule" => array(
1079     "BTbot/([0-9.]{1,10})" => "\\1"
1080     ),
1081     "uri" => ""
1082     ),
1083     "builtwith" => array(
1084     "icon" => "builtwith",
1085     "title" => "BuiltWith",
1086     "rule" => array(
1087     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1088     ),
1089     "uri" => "http://builtwith.com/bot.html"
1090     ),
1091     "bulkfeeds" => array(
1092     "icon" => "robot",
1093     "title" => "Bulkfeeds",
1094     "rule" => array(
1095     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1096     ),
1097     "uri" => ""
1098     ),
1099     "burf" => array(
1100     "icon" => "burf",
1101     "title" => "Burf.com",
1102     "rule" => array(
1103     "^Norbert the Spider" => ""
1104     ),
1105     "uri" => "http://www.burf.com/"
1106     ),
1107     "butch" => array(
1108     "icon" => "robot",
1109     "title" => "Butch",
1110     "rule" => array(
1111     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1112     ),
1113     "uri" => ""
1114     ),
1115     "buzzlogic" => array(
1116     "icon" => "buzzlogic",
1117     "title" => "Buzzlogic",
1118     "rule" => array(
1119     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1120     ),
1121     "uri" => "http://www.buzzlogic.com"
1122     ),
1123     "catchbot" => array(
1124     "icon" => "catchbot",
1125     "title" => "CatchBot",
1126     "rule" => array(
1127     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1128     ),
1129     "uri" => "http://www.catchbot.com"
1130     ),
1131     "camdiscover" => array(
1132     "icon" => "robot",
1133     "title" => "Camdiscover",
1134     "rule" => array(
1135     "^Camcrawler" => ""
1136     ),
1137     "uri" => ""
1138     ),
1139     "cazoodle" => array(
1140     "icon" => "cazoodle",
1141     "title" => "Cazoodle",
1142     "rule" => array(
1143     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1144     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.cazoodle.com/cazoodlebot"
1147     ),
1148     "ccbot" => array(
1149     "icon" => "robot",
1150     "title" => "ccBot",
1151     "rule" => array(
1152     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1153     ),
1154     "uri" => "http://www.commoncrawl.org/bot.html"
1155     ),
1156     "ccgcrawl" => array(
1157     "icon" => "robot",
1158     "title" => "CCGCrawl",
1159     "rule" => array(
1160     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1161     ),
1162     "uri" => "http://www.myworkbase.com/bot.html"
1163     ),
1164     "cerberian" => array(
1165     "icon" => "robot",
1166     "title" => "Cerberian Drtrs",
1167     "rule" => array(
1168     "^Cerberian Drtrs" => ""
1169     ),
1170     "uri" => ""
1171     ),
1172     "cfnetwork" => array(
1173     "icon" => "robot",
1174     "title" => "CFNetwork", // label follows this entry's key and rule; "Cerberian Drtrs" is the separate cerberian entry
1175     "rule" => array(
1176     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1177     ),
1178     "uri" => "http://www.cfnetwork.be/"
1179     ),
1180     "charlotte" => array(
1181     "icon" => "charlotte",
1182     "title" => "Charlotte",
1183     "rule" => array(
1184     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1185     ),
1186     "uri" => ""
1187     ),
1188     "cirilizator" => array(
1189     "icon" => "cirilizator",
1190     "title" => "Cirilizator",
1191     "rule" => array(
1192     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1193     ),
1194     "uri" => ""
1195     ),
1196     "claria" => array(
1197     "icon" => "robot",
1198     "title" => "Claria",
1199     "rule" => array(
1200     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1201     "(Claria|Diamond)(Bot)" => ""
1202     ),
1203     "uri" => ""
1204     ),
1205     "claymont" => array(
1206     "icon" => "claymont",
1207     "title" => "Claymont",
1208     "rule" => array(
1209     "claymont\.com" => "",
1210     "OliverPerry" => ""
1211     ),
1212     "uri" => "http://www.claymont.com"
1213     ),
1214     "clush" => array(
1215     "icon" => "clush",
1216     "title" => "Clush",
1217     "rule" => array(
1218     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1219     ),
1220     "uri" => ""
1221     ),
1222     "cmsworldmap" => array(
1223     "icon" => "cmsworldmap",
1224     "title" => "CMS World Map",
1225     "rule" => array(
1226     "cmsworldmap" => ""
1227     ),
1228     "uri" => "http://www.cmsworldmap.com/"
1229     ),
1230     "cobion" => array(
1231     "icon" => "robot",
1232     "title" => "Cobion",
1233     "rule" => array(
1234     " (QXW03018|obot)\)" => ""
1235     ),
1236     "uri" => ""
1237     ),
1238     "coccoc" => array(
1239 matthys 287 "icon" => "coccoc",
1240 matthys 209 "title" => "Coccoc",
1241 joku 63 "rule" => array(
1242     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1243     ),
1244 matthys 287 "uri" => "http://help.coccoc.com"
1245 joku 63 ),
1246     "coldfusion" => array(
1247     "icon" => "coldfusion",
1248     "title" => "ColdFusion",
1249     "rule" => array(
1250     "^coldfusion" => ""
1251     ),
1252     "uri" => ""
1253     ),
1254     "combine" => array(
1255     "icon" => "robot",
1256     "title" => "Combine",
1257     "rule" => array(
1258     "Combine[ /]([0-9.]{1,10})" => "\\1"
1259     ),
1260     "uri" => ""
1261     ),
1262     "combot" => array(
1263     "icon" => "robot",
1264     "title" => "comBot",
1265     "rule" => array(
1266     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1267     ),
1268     "uri" => ""
1269     ),
1270     "comet" => array(
1271     "icon" => "comet",
1272     "title" => "Comet",
1273     "rule" => array(
1274     "cometsearch@cometsystems" => ""
1275     ),
1276     "uri" => ""
1277     ),
1278     "commerobo" => array(
1279     "icon" => "robot",
1280     "title" => "Commerobo",
1281     "rule" => array(
1282     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1283     ),
1284     "uri" => ""
1285     ),
1286     "comrite" => array(
1287     "icon" => "robot",
1288     "title" => "ComRite",
1289     "rule" => array(
1290     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1291     ),
1292     "uri" => "http://www.comrite.com/"
1293     ),
1294     "convera" => array(
1295     "icon" => "convera",
1296     "title" => "Convera",
1297     "rule" => array(
1298     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1299     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1300     ),
1301     "uri" => ""
1302     ),
1303     "coolbot" => array(
1304     "icon" => "robot",
1305     "title" => "CoolBot",
1306     "rule" => array(
1307     "^CoolBot" => ""
1308     ),
1309     "uri" => ""
1310     ),
1311     "cosmix" => array(
1312     "icon" => "robot",
1313     "title" => "Cosmix",
1314     "rule" => array(
1315     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1316     ),
1317     "uri" => ""
1318     ),
1319     "cosmos" => array(
1320     "icon" => "robot",
1321     "title" => "Cosmos",
1322     "rule" => array(
1323     "^cosmos" => ""
1324     ),
1325     "uri" => ""
1326     ),
1327     "cosmoty" => array(
1328     "icon" => "robot",
1329     "title" => "Cosmoty",
1330     "rule" => array(
1331     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1332     ),
1333     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1334     ),
1335     "covario" => array(
1336     "icon" => "covario",
1337     "title" => "Covario",
1338     "rule" => array(
1339     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1340     ),
1341     "uri" => "http://www.covario.com/ids/"
1342     ),
1343     "creativecommons" => array(
1344     "icon" => "creativecommons",
1345     "title" => "Creative Commons",
1346     "rule" => array(
1347     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1348     ),
1349     "uri" => ""
1350     ),
1351     "cscrawler" => array(
1352     "icon" => "robot",
1353     "title" => "CsCrawler",
1354     "rule" => array(
1355     "CsCrawler" => ""
1356     ),
1357     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1358     ),
1359 joku 111 "jigsaw" => array(
1360     "icon" => "jigsaw",
1361     "title" => "Jigsaw",
1362     "rule" => array(
1363     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1364     ),
1365     "uri" => "http://jigsaw.w3.org/css-validator/"
1366     ),
1367 joku 63 "csscheck" => array(
1368     "icon" => "w3c",
1369     "title" => "W3C CSS Validator",
1370     "rule" => array(
1371     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1372     ),
1373     "uri" => "http://jigsaw.w3.org/css-validator/"
1374     ),
1375     "custo" => array(
1376     "icon" => "robot",
1377     "title" => "Custo",
1378     "rule" => array(
1379     "Custo[ /]([0-9.]{1,10})" => "\\1"
1380     ),
1381     "uri" => ""
1382     ),
1383     "cybernavi" => array(
1384     "icon" => "robot",
1385     "title" => "CyberNavi",
1386     "rule" => array(
1387     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1388     ),
1389     "uri" => ""
1390     ),
1391     "cyberpatrol" => array(
1392     "icon" => "cyberpatrol",
1393     "title" => "CyberPatrol",
1394     "rule" => array(
1395     "^CyberPatrol" => ""
1396     ),
1397     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1398     ),
1399     "cyberz" => array(
1400     "icon" => "cyberz",
1401     "title" => "Cyberz",
1402     "rule" => array(
1403     "Cyberz Communication Agent" => ""
1404     ),
1405     "uri" => ""
1406     ),
1407     "cydral" => array(
1408     "icon" => "robot",
1409     "title" => "Cydral",
1410     "rule" => array(
1411     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1412     ),
1413     "uri" => ""
1414     ),
1415     "cynthia" => array(
1416     "icon" => "cynthia",
1417     "title" => "Cynthia Says",
1418     "rule" => array(
1419     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1420     ),
1421     "uri" => ""
1422     ),
1423     "d4x" => array(
1424     "icon" => "d4x",
1425     "title" => "Downloader for X",
1426     "rule" => array(
1427     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1428     ),
1429     "uri" => ""
1430     ),
1431     "da" => array(
1432     "icon" => "da",
1433     "title" => "DA",
1434     "rule" => array(
1435     "^DA[ /]([0-9.]{1,10})" => "\\1"
1436     ),
1437     "uri" => ""
1438     ),
1439     "daum" => array( // Daum crawlers; any one of the rule patterns below identifies the robot
1440     "icon" => "daum",
1441     "title" => "DAUM",
1442     "rule" => array(
1443     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1444     "DAUM Web Robot" => "",
1445 joku 339 "daum\.net" => "", // dot escaped so only a literal "daum.net" matches
1446 joku 63 "Daum Communications Corp" => "",
1447     "EDI[ /]([0-9.]{1,10})" => "\\1",
1448     "Edacious.*Intelligent Web Robot" => "",
1449     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1450     ),
1451     "uri" => "http://ws.daum.net/"
1452     ),
1453     "daypop" => array(
1454     "icon" => "robot",
1455     "title" => "Daypop",
1456     "rule" => array(
1457     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1458     ),
1459     "uri" => ""
1460     ),
1461     "delfi" => array(
1462     "icon" => "delfi",
1463     "title" => "Delfi",
1464     "rule" => array(
1465     "crawl at delfi dot lt" => ""
1466     ),
1467     "uri" => ""
1468     ),
1469     "depspid" => array(
1470     "icon" => "depspid",
1471     "title" => "DepSpid",
1472     "rule" => array(
1473     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1474     ),
1475     "uri" => ""
1476     ),
1477     "devonagent" => array(
1478     "icon" => "devonagent",
1479     "title" => "DEVONagent",
1480     "rule" => array(
1481     "DEVONtech" => ""
1482     ),
1483     "uri" => ""
1484     ),
1485     "diffbot" => array(
1486     "icon" => "diffbot",
1487     "title" => "Diffbot",
1488     "rule" => array(
1489     " Diffbot" => ""
1490     ),
1491     "uri" => "http://www.diffbot.com"
1492     ),
1493     "diribot" => array(
1494     "icon" => "diribot",
1495     "title" => "Diri",
1496     "rule" => array(
1497     "diribot" => ""
1498     ),
1499     "uri" => "http://www.diri.bg"
1500     ),
1501     "directhit" => array(
1502     "icon" => "robot",
1503     "title" => "Direct Hit",
1504     "rule" => array(
1505     "EZResult -- Internet Search Engine" => ""
1506     ),
1507     "uri" => "http://www.directhit.com"
1508     ),
1509     "disco" => array( // Discovery Engine crawler, matched by product token or contact address
1510     "icon" => "disco",
1511 matthys 209 "title" => "Disco",
1512 joku 63 "rule" => array(
1513     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1514     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1515     "disco-crawl@discoveryengine\.com" => "" // dot escaped: match the literal address only
1516     ),
1517     "uri" => "http://www.discoveryengine.com/"
1518     ),
1519     "discopump" => array(
1520     "icon" => "robot",
1521     "title" => "DISCo Pump",
1522     "rule" => array(
1523     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1524     ),
1525     "uri" => ""
1526     ),
1527     "dkimreputation" => array(
1528     "icon" => "dkimreputation",
1529     "title" => "DKIM Reputation",
1530     "rule" => array(
1531     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1532     ),
1533     "uri" => "http://www.dkim-reputation.org"
1534     ),
1535     "dnsdigger" => array(
1536     "icon" => "dnsdigger",
1537     "title" => "DNS-Digger",
1538     "rule" => array(
1539     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1540     ),
1541     "uri" => "http://www.dnsdigger.com"
1542     ),
1543     "dnsvalidation" => array(
1544     "icon" => "dnsvalidation",
1545     "title" => "DNS Validation",
1546     "rule" => array(
1547     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1548     ),
1549     "uri" => "http://www.dnsvalidation.com/"
1550     ),
1551     "doctorhtml" => array(
1552     "icon" => "robot",
1553     "title" => "DoctorHTML",
1554     "rule" => array(
1555     "Doctor[ \-]?HTML" => ""
1556     ),
1557     "uri" => ""
1558     ),
1559     "dolphin" => array(
1560     "icon" => "dolphin",
1561     "title" => "Dolphin",
1562     "rule" => array(
1563     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1564     ),
1565     "uri" => "http://telehouse.ru/crawler.html"
1566     ),
1567     "domaindatei" => array(
1568     "icon" => "robot",
1569     "title" => "Domaindatei",
1570     "rule" => array(
1571     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1572     ),
1573     "uri" => ""
1574     ),
1575     "dontbuylists" => array(
1576     "icon" => "dontbuylists",
1577     "title" => "Dontbuylists",
1578     "rule" => array(
1579     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1580     ),
1581     "uri" => "http://www.dontbuylists.com"
1582     ),
1583     "dotbot" => array(
1584     "icon" => "robot",
1585     "title" => "DotBot",
1586     "rule" => array(
1587     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1588     ),
1589     "uri" => "http://www.dotnetdotcom.org"
1590     ),
1591     "doweb" => array( // user agents that start with the DoWeb host name
1592     "icon" => "doweb",
1593     "title" => "DoWeb",
1594     "rule" => array(
1595     "^www\.doweb\.co\.uk" => "" // dots escaped so they match literal "." only
1596     ),
1597     "uri" => "http://www.doweb.co.uk/"
1598     ),
1599     "downforeveryoneorjustme" => array(
1600     "icon" => "downforeveryoneorjustme",
1601     "title" => "Down for everyone or just me",
1602     "rule" => array(
1603     "downforeveryoneorjustme" => ""
1604     ),
1605     "uri" => "http://www.downforeveryoneorjustme.com"
1606     ),
1607     "downloadninja" => array(
1608     "icon" => "robot",
1609     "title" => "Download Ninja",
1610     "rule" => array(
1611     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1612     ),
1613     "uri" => ""
1614     ),
1615     "drupal" => array(
1616     "icon" => "drupal",
1617     "title" => "Drupal",
1618     "rule" => array(
1619     "^Drupal" => ""
1620     ),
1621     "uri" => ""
1622     ),
1623     "dsns" => array(
1624     "icon" => "robot",
1625     "title" => "DSNS Scanner",
1626     "rule" => array(
1627     "^DSNS" => ""
1628     ),
1629     "uri" => ""
1630     ),
1631     "dtsagent" => array(
1632     "icon" => "robot",
1633     "title" => "DTS Agent",
1634     "rule" => array(
1635     "DTS Agent" => ""
1636     ),
1637     "uri" => ""
1638     ),
1639 matthys 342 "duckduckgo" => array(
1640     "icon" => "duckduckgo",
1641     "title" => "DuckDuckGo",
1642     "rule" => array(
1643     "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1"
1644     ),
1645     "uri" => "http://duckduckgo.com"
1646     ),
1647 joku 63 "earthcom" => array(
1648     "icon" => "earthcom",
1649     "title" => "Earthcom",
1650     "rule" => array(
1651     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1652     ),
1653     "uri" => ""
1654     ),
1655     "ebay" => array(
1656     "icon" => "ebay",
1657     "title" => "eBay",
1658     "rule" => array(
1659     "eBay Relevance Ad Crawler" => ""
1660     ),
1661     "uri" => ""
1662     ),
1663     "echo" => array(
1664     "icon" => "robot",
1665     "title" => "Echo.com",
1666     "rule" => array(
1667     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1668     ),
1669     "uri" => "http://www.echo.com/"
1670     ),
1671     "eert" => array(
1672     "icon" => "robot",
1673 matthys 209 "title" => "Eert",
1674 joku 63 "rule" => array(
1675     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1676     ),
1677     "uri" => "http://bot.eert.net"
1678     ),
1679     "eknip" => array(
1680     "icon" => "eknip",
1681     "title" => "E-Knip",
1682     "rule" => array(
1683     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1684     ),
1685     "uri" => ""
1686     ),
1687     "zoominfo" => array(
1688     "icon" => "zoominfo",
1689 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1690 joku 63 "rule" => array(
1691     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1692     ),
1693     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1694     ),
1695     "emeraldshield" => array(
1696     "icon" => "emeraldshield",
1697     "title" => "EmeraldShield",
1698     "rule" => array(
1699     "^EmeraldShield" => ""
1700     ),
1701     "uri" => ""
1702     ),
1703     "empas" => array(
1704     "icon" => "empas",
1705     "title" => "Empas",
1706     "rule" => array(
1707     "DigExt; empas\)$" => "",
1708     "^EMPAS[_\-]ROBOT" => ""
1709     ),
1710     "uri" => ""
1711     ),
1712     "entireweb" => array(
1713     "icon" => "entireweb",
1714     "title" => "Entireweb",
1715     "rule" => array(
1716     "Speedy[ ]?Spider" => ""
1717     ),
1718     "uri" => ""
1719     ),
1720     "envolk" => array(
1721     "icon" => "envolk",
1722     "title" => "Envolk",
1723     "rule" => array(
1724     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1725     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1726     ),
1727     "uri" => ""
1728     ),
1729     "esnet" => array( // "ES.NET Crawler" followed by a version number
1730     "icon" => "robot",
1731     "title" => "ES.NET",
1732     "rule" => array(
1733     "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped; \\1 refers to the captured version
1734     ),
1735     "uri" => ""
1736     ),
1737     "estyle" => array(
1738     "icon" => "estyle",
1739     "title" => "eStyle Search",
1740     "rule" => array(
1741     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1742     ),
1743     "uri" => ""
1744     ),
1745     "eurip" => array(
1746     "icon" => "robot",
1747     "title" => "Eurip",
1748     "rule" => array(
1749     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1750     ),
1751     "uri" => "http://www.eurip.com"
1752     ),
1753     "eurodirectory" => array(
1754     "icon" => "robot",
1755     "title" => "Euro Directory",
1756     "rule" => array(
1757     "www\.euro-directory\.com" => ""
1758     ),
1759     "uri" => "http://www.euro-directory.com/"
1760     ),
1761     "euroseek" => array(
1762     "icon" => "euroseek",
1763     "title" => "EuroSeek",
1764     "rule" => array(
1765     "Arachnoidea" => ""
1766     ),
1767     "uri" => ""
1768     ),
1769     "evaal" => array(
1770     "icon" => "evaal",
1771     "title" => "Evaal",
1772     "rule" => array(
1773     "^EvaalSE" => ""
1774     ),
1775     "uri" => "http://www.evaal.com/"
1776     ),
1777     "eventax" => array(
1778     "icon" => "eventax",
1779     "title" => "Eventax",
1780     "rule" => array(
1781     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1782     ),
1783     "uri" => "http://www.eventax.de/"
1784     ),
1785     "everbee" => array(
1786     "icon" => "everbee",
1787     "title" => "Everbee",
1788     "rule" => array(
1789     "EverbeeCrawler" => ""
1790     ),
1791     "uri" => ""
1792     ),
1793     "everest" => array( // "Everest-Vulcan Inc." followed by a version number
1794     "icon" => "everest",
1795     "title" => "Everest",
1796     "rule" => array(
1797     "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // dot after "Inc" escaped to match literally
1798     ),
1799     "uri" => ""
1800     ),
1801     "exabot" => array(
1802     "icon" => "exabot",
1803     "title" => "ExaBot",
1804     "rule" => array(
1805     "^NG[ /]([0-9.]{1,10})" => "\\1",
1806     "Exabot/([0-9.]{1,10})" => "\\1",
1807     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1808     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1809     "ExaBot-Thumbnails" => ""
1810     ),
1811     "uri" => "http://www.exabot.com/go/robot"
1812     ),
1813     "exactseek" => array(
1814     "icon" => "exactseek",
1815     "title" => "ExactSeek",
1816     "rule" => array(
1817     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1818     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1819     ),
1820     "uri" => "http://www.exactseek.com/"
1821     ),
1822     "excite" => array(
1823     "icon" => "excite",
1824     "title" => "Excite",
1825     "rule" => array(
1826     "Architext[ \-]?Spider" => ""
1827     ),
1828     "uri" => ""
1829     ),
1830     "execrawl" => array(
1831     "icon" => "robot",
1832     "title" => "Execrawl",
1833     "rule" => array(
1834     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1835     "Execrawl" => ""
1836     ),
1837     "uri" => ""
1838     ),
1839     "expertmonitor" => array(
1840     "icon" => "robot",
1841     "title" => "ExpertMonitor",
1842     "rule" => array(
1843     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1844     ),
1845     "uri" => ""
1846     ),
1847     "explorerrss" => array(
1848     "icon" => "robot",
1849     "title" => "Explorer RSS",
1850     "rule" => array(
1851     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1852     ),
1853     "uri" => ""
1854     ),
1855     "ezooms" => array(
1856     "icon" => "robot",
1857     "title" => "Ezooms",
1858     "rule" => array(
1859     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1860     ),
1861     "uri" => ""
1862     ),
1863     "facebook" => array(
1864     "icon" => "facebook",
1865     "title" => "Facebook",
1866     "rule" => array(
1867     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1868     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1869     "^facebook" => ""
1870     ),
1871     "uri" => "http://www.facebook.com/"
1872     ),
1873     "fast" => array(
1874     "icon" => "fast",
1875     "title" => "Fast",
1876     "rule" => array(
1877     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1878     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1879     "^Fast Crawler" => "",
1880     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1881     ),
1882     "uri" => "http://www.alltheweb.com/"
1883     ),
1884     "fastbuzz" => array(
1885     "icon" => "fastbuzz",
1886     "title" => "Fastbuzz",
1887     "rule" => array(
1888     "^fastbuzz\.com" => ""
1889     ),
1890     "uri" => ""
1891     ),
1892     "favorg" => array(
1893     "icon" => "robot",
1894     "title" => "FavOrg",
1895     "rule" => array(
1896     "^FavOrg" => ""
1897     ),
1898     "uri" => ""
1899     ),
1900     "favorstar" => array(
1901     "icon" => "favorstar",
1902 matthys 209 "title" => "Favorstar",
1903 joku 63 "rule" => array(
1904     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1905     ),
1906     "uri" => "http://favorstar.com/bot.html"
1907     ),
1908     "faxo" => array(
1909     "icon" => "robot",
1910     "title" => "Faxo",
1911     "rule" => array(
1912     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1913     ),
1914     "uri" => "http://www.faxo.com/"
1915     ),
1916     "fdse" => array(
1917     "icon" => "robot",
1918     "title" => "FDSE Robot",
1919     "rule" => array(
1920     "FDSE[ \-]?robot" => ""
1921     ),
1922     "uri" => ""
1923     ),
1924     "feedback" => array(
1925     "icon" => "robot",
1926     "title" => "FeedBack",
1927     "rule" => array(
1928     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1929     ),
1930     "uri" => ""
1931     ),
1932     "feedburner" => array(
1933     "icon" => "feedburner",
1934     "title" => "FeedBurner",
1935     "rule" => array(
1936     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1937     ),
1938     "uri" => ""
1939     ),
1940     "feeddemon" => array(
1941     "icon" => "feeddemon",
1942     "title" => "FeedDemon",
1943     "rule" => array(
1944     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1945     ),
1946     "uri" => ""
1947     ),
1948     "feedfind" => array(
1949     "icon" => "feedfind",
1950     "title" => "FeedFind",
1951     "rule" => array(
1952     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1953     ),
1954     "uri" => ""
1955     ),
1956     "feedonfeeds" => array(
1957     "icon" => "robot",
1958     "title" => "Feed On Feeds",
1959     "rule" => array(
1960     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1961     ),
1962     "uri" => ""
1963     ),
1964     "feedparser" => array(
1965     "icon" => "robot",
1966     "title" => "Feedparser",
1967     "rule" => array(
1968     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1969     "FeedParser" => ""
1970     ),
1971     "uri" => ""
1972     ),
1973     "feedreader" => array(
1974     "icon" => "feedreader",
1975     "title" => "Feedreader",
1976     "rule" => array(
1977     "^Feedreader" => ""
1978     ),
1979     "uri" => ""
1980     ),
1981     "feedserver" => array(
1982     "icon" => "robot",
1983     "title" => "FeedServer",
1984     "rule" => array(
1985     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
1986     ),
1987     "uri" => ""
1988     ),
1989     "feedster" => array(
1990     "icon" => "feedster",
1991     "title" => "Feedster",
1992     "rule" => array(
1993     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
1994     ),
1995     "uri" => ""
1996     ),
1997     "feedvalidator" => array(
1998     "icon" => "feedvalidator",
1999     "title" => "Feed Validator",
2000     "rule" => array(
2001     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2002     ),
2003     "uri" => ""
2004     ),
2005     "fdm" => array(
2006     "icon" => "robot",
2007     "title" => "Free Download Manager",
2008     "rule" => array(
2009     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2010     ),
2011     "uri" => ""
2012     ),
2013     "filangy" => array(
2014     "icon" => "robot",
2015     "title" => "Filangy",
2016     "rule" => array(
2017     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2018     ),
2019     "uri" => "http://www.filangy.com/"
2020     ),
2021     "findanisp" => array(
2022     "icon" => "robot",
2023     "title" => "FindAnISP",
2024     "rule" => array(
2025     "FindAnISP" => ""
2026     ),
2027     "uri" => "http://www.findanisp.com/"
2028     ),
2029     "findengines" => array(
2030     "icon" => "findengines",
2031     "title" => "FindEngines",
2032     "rule" => array(
2033     "FindEngines! Bot" => ""
2034     ),
2035     "uri" => ""
2036     ),
2037     "findexa" => array(
2038     "icon" => "findexa",
2039     "title" => "Findexa",
2040     "rule" => array(
2041     "Findexa Crawler" => ""
2042     ),
2043     "uri" => ""
2044     ),
2045     "findlinks" => array(
2046     "icon" => "findlinks",
2047     "title" => "FindLinks",
2048     "rule" => array(
2049     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2050     "^FindLinks" => ""
2051     ),
2052     "uri" => ""
2053     ),
2054     "findoor" => array( // user agents that start with "findoor", optionally suffixed "-Bot"
2055     "icon" => "findoor",
2056 matthys 209 "title" => "Findoor",
2057 joku 63 "rule" => array(
2058     "^findoor(-Bot)?" => "" // no version is captured; NOTE(review): was "\\1", i.e. the "-Bot" suffix - confirm nothing relied on it
2059     ),
2060     "uri" => ""
2061     ),
2062     "firefly" => array(
2063     "icon" => "firefly",
2064     "title" => "Firefly",
2065     "rule" => array(
2066     "Firefly" => ""
2067     ),
2068     "uri" => ""
2069     ),
2070     "flashget" => array(
2071     "icon" => "flashget",
2072     "title" => "FlashGet",
2073     "rule" => array(
2074     "^FlashGet" => ""
2075     ),
2076     "uri" => ""
2077     ),
2078     "flatland" => array(
2079     "icon" => "flatland",
2080     "title" => "Flatland",
2081     "rule" => array(
2082     "^flatlandbot" => ""
2083     ),
2084     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2085     ),
2086     "flickbot" => array(
2087     "icon" => "flickbot",
2088     "title" => "FlickBot",
2089     "rule" => array(
2090     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2091     ),
2092     "uri" => ""
2093     ),
2094     "flightdeckreports" => array(
2095     "icon" => "flightdeckreports",
2096     "title" => "Flight Deck Reports",
2097     "rule" => array(
2098     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2099     ),
2100     "uri" => "http://www.flightdeckreports.com/"
2101     ),
2102     "forex" => array(
2103     "icon" => "robot",
2104     "title" => "Forex",
2105     "rule" => array(
2106     "^Forex Trading Network Organization" => ""
2107     ),
2108     "uri" => "http://www.netforex.org/"
2109     ),
2110     "freshmeat" => array( // Freshmeat URL validator, under either of its two product names
2111     "icon" => "freshmeat",
2112 matthys 209 "title" => "Freshmeat",
2113 joku 63 "rule" => array(
2114     "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2115     "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped to match "freshmeat.net" literally
2116     ),
2117     "uri" => "http://www.freshmeat.net/"
2118     ),
2119     "friend" => array(
2120     "icon" => "friend",
2121     "title" => "Friend",
2122     "rule" => array(
2123     "www\.friend\.fr" => ""
2124     ),
2125     "uri" => "http://www.friend.fr/"
2126     ),
2127     "frontier" => array(
2128     "icon" => "frontier",
2129     "title" => "Frontier",
2130     "rule" => array(
2131     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2132     ),
2133     "uri" => ""
2134     ),
2135     "fyberspider" => array(
2136     "icon" => "robot",
2137     "title" => "FyberSpider",
2138     "rule" => array(
2139     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2140     ),
2141     "uri" => "http://www.fyberspider.com/"
2142     ),
2143     "gaisbot" => array(
2144     "icon" => "gais",
2145     "title" => "Gaisbot",
2146     "rule" => array(
2147     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2148     ),
2149     "uri" => ""
2150     ),
2151     "galaxy" => array( // GalaxyBot with a version, or any agent naming the Galaxy host
2152     "icon" => "galaxy",
2153     "title" => "Galaxy",
2154     "rule" => array(
2155     "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2156     "www\.galaxy\.com" => "" // dots escaped so they match literal "." only
2157     ),
2158     "uri" => "http://www.galaxy.com/"
2159     ),
2160     "gamespy" => array(
2161     "icon" => "gamespy",
2162     "title" => "GameSpy",
2163     "rule" => array(
2164     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2165     ),
2166     "uri" => ""
2167     ),
2168     "garlik" => array(
2169     "icon" => "garlik",
2170     "title" => "Garlik",
2171     "rule" => array(
2172     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2173     ),
2174     "uri" => "http://garlik.com/"
2175     ),
2176     "gdesktop" => array(
2177     "icon" => "gdesktop",
2178     "title" => "Google Desktop",
2179     "rule" => array(
2180     "compatible; Google Desktop" => ""
2181     ),
2182     "uri" => ""
2183     ),
2184     "genome" => array(
2185     "icon" => "robot",
2186     "title" => "Genome Machine",
2187     "rule" => array(
2188     "Genome[ \-]?Machine" => ""
2189     ),
2190     "uri" => ""
2191     ),
2192     "geohash" => array(
2193     "icon" => "geohash",
2194     "title" => "Geohash",
2195     "rule" => array(
2196     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2197     ),
2198     "uri" => "http://geohash.org/"
2199     ),
2200     "geona" => array(
2201     "icon" => "robot",
2202     "title" => "Geona",
2203     "rule" => array(
2204     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2205     ),
2206     "uri" => ""
2207     ),
2208     "geoblog" => array(
2209     "icon" => "robot",
2210     "title" => "The World as a Blog",
2211     "rule" => array(
2212     "The World as a Blog" => ""
2213     ),
2214     "uri" => ""
2215     ),
2216     "geourl" => array(
2217     "icon" => "geourl",
2218     "title" => "GeoUrl",
2219     "rule" => array(
2220     "geourl[ /]([0-9.]{1,10})" => "\\1",
2221     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2222     ),
2223     "uri" => ""
2224     ),
2225     "getnetwise" => array(
2226     "icon" => "robot",
2227     "title" => "GetNetWise",
2228     "rule" => array(
2229     " Crayon Crawler" => ""
2230     ),
2231     "uri" => ""
2232     ),
2233     "getright" => array(
2234     "icon" => "getright",
2235     "title" => "GetRight",
2236     "rule" => array(
2237     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2238     ),
2239     "uri" => ""
2240     ),
2241     "getsmart" => array(
2242     "icon" => "getsmart",
2243     "title" => "GetSmart",
2244     "rule" => array(
2245     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2246     ),
2247     "uri" => ""
2248     ),
2249     "gigabot" => array(
2250     "icon" => "gigablast",
2251     "title" => "Gigablast",
2252     "rule" => array(
2253     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2254     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2255 joku 336 "GigablastOpenSource" => ""
2256 joku 63 ),
2257     "uri" => ""
2258 matthys 328 ),
2259     "gimme" => array(
2260     "icon" => "gimme",
2261     "title" => "gimmeUSA",
2262     "rule" => array(
2263     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2264     ),
2265     "uri" => "http://gimme60.com"
2266 joku 63 ),
2267 matthys 328 "ginger" => array(
2268     "icon" => "ginger",
2269     "title" => "GingerCrawler",
2270     "rule" => array(
2271     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2272     ),
2273     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2274     ),
2275 joku 63 "girafabot" => array(
2276     "icon" => "girafa",
2277     "title" => "Girafa",
2278     "rule" => array(
2279     "Girafabot" => ""
2280     ),
2281     "uri" => ""
2282     ),
2283     "globalspec" => array(
2284     "icon" => "globalspec",
2285     "title" => "GlobalSpec",
2286     "rule" => array(
2287     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2288     ),
2289     "uri" => ""
2290     ),
2291     "glucose" => array(
2292     "icon" => "glucose",
2293     "title" => "Glucose",
2294     "rule" => array(
2295     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2296     ),
2297     "uri" => ""
2298     ),
2299     "gnomit" => array(
2300     "icon" => "gnomit",
2301     "title" => "Gnomit",
2302     "rule" => array(
2303     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2304     ),
2305     "uri" => "http://www.gnomit.com/",
2306     ),
2307     "goforit" => array(
2308     "icon" => "goforit",
2309     "title" => "GoForIt",
2310     "rule" => array(
2311     "^GoForIt\.com" => "",
2312     "^GOFORITBOT" => ""
2313     ),
2314     "uri" => ""
2315     ),
2316     "goguides" => array(
2317     "icon" => "robot",
2318     "title" => "GoGuides",
2319     "rule" => array(
2320     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2321     ),
2322     "uri" => "http://www.goguides.org/"
2323     ),
2324     // Needs to be before google for correct detection
2325     "mediapartners" => array(
2326     "icon" => "google",
2327     "title" => "Mediapartners",
2328     "rule" => array (
2329     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2330     "Mediapartners-Google" => ""
2331     ),
2332     "uri" => ""
2333     ),
2334     "google" => array(
2335     "icon" => "google",
2336     "title" => "Google",
2337     "rule" => array (
2338     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2339     "Googl(e|ebot)(-Image)?/" => "",
2340     "^gsa-crawler" => "",
2341     "Google Web Preview" => ""
2342     ),
2343     "uri" => "http://www.google.com/"
2344     ),
2345     "googlesitemaps" => array(
2346     "icon" => "google",
2347     "title" => "Google-Sitemaps",
2348     "rule" => array (
2349     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2350     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2351     "Googl(e|ebot)(-Sitemaps)?/" => ""
2352     ),
2353     "uri" => ""
2354     ),
2355     "googlemobile" => array(
2356     "icon" => "google",
2357     "title" => "Google-Mobile",
2358     "rule" => array (
2359     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2360     "Googl(e|ebot)(-Mobile)?/" => ""
2361     ),
2362     "uri" => ""
2363     ),
2364     "googleads" => array(
2365     "icon" => "google",
2366     "title" => "Google-AdsBot",
2367     "rule" => array (
2368     "^AdsBot-Google" => "",
2369     ),
2370     "uri" => ""
2371     ),
2372     "googlefeeds" => array(
2373     "icon" => "google",
2374     "title" => "Google-Feedfetcher",
2375     "rule" => array (
2376     "^Feedfetcher-Google" => "",
2377     ),
2378     "uri" => ""
2379     ),
2380     "googlverification" => array(
2381     "icon" => "google",
2382     "title" => "Google-Site-Verification",
2383     "rule" => array (
2384     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2385     ),
2386     "uri" => ""
2387     ),
2388 matthys 207 // Needs to be AFTER Google detection
2389     "goo" => array(
2390     "icon" => "goo",
2391     "title" => "Goo",
2392     "rule" => array (
2393     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2394     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2395     ),
2396     "uri" => ""
2397     ),
2398 joku 63 "goongee" => array( // GoonGee: matches user agents starting with "Big Fish"
2399     "icon" => "robot",
2400     "title" => "GoonGee",
2401     "rule" => array (
2402     "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // only one capture group (the version); "\\2" never resolved
2403     ),
2404     "uri" => "http://www.goongee.com/"
2405     ),
2406     "gpost" => array(
2407     "icon" => "gpost",
2408     "title" => "GPost",
2409     "rule" => array(
2410     "^GPostbot" => ""
2411     ),
2412     "uri" => ""
2413     ),
2414 matthys 309 "grapeshot" => array(
2415     "icon" => "grapeshot",
2416     "title" => "Grapeshot",
2417     "rule" => array(
2418     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2419     ),
2420     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2421     ),
2422 joku 63 "gregarius" => array( // Gregarius: matches user agents starting with "Gregarius"
2423     "icon" => "robot",
2424     "title" => "Gregarius",
2425     "rule" => array(
2426     "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // report the captured version, as sibling entries do (was "")
2427     ),
2428     "uri" => ""
2429     ),
2430     "grub" => array(
2431     "icon" => "grub",
2432     "title" => "Grub",
2433     "rule" => array(
2434     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2435     "grub crawler" => "",
2436     "grub[/ ]([0-9.]{1,10})" => "\\1",
2437     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2438     ),
2439     "uri" => "http://www.grub.org/"
2440     ),
2441     "gulliver" => array(
2442     "icon" => "robot",
2443     "title" => "Gulliver",
2444     "rule" => array(
2445     "Gulliver" => ""
2446     ),
2447     "uri" => ""
2448     ),
2449     "guruji" => array(
2450     "icon" => "guruji",
2451     "title" => "Guruji",
2452     "rule" => array(
2453     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2454     ),
2455     "uri" => "http://www.guruji.com/"
2456     ),
2457     "gush" => array(
2458     "icon" => "robot",
2459     "title" => "Gush",
2460     "rule" => array(
2461     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2462     ),
2463     "uri" => ""
2464     ),
2465     "gziptester" => array(
2466     "icon" => "robot",
2467     "title" => "Gzip Tester",
2468     "rule" => array(
2469     "g(id)?zip[ \-]?test(er)?" => ""
2470     ),
2471     "uri" => ""
2472     ),
2473     "hanzoweb" => array(
2474     "icon" => "hanzoweb",
2475     "title" => "Hanzoweb",
2476     "rule" => array(
2477     "^Hanzoweb" => ""
2478     ),
2479     "uri" => ""
2480     ),
2481     "harbot" => array(
2482     "icon" => "harbot",
2483     "title" => "Harbot",
2484     "rule" => array(
2485     "^Harbot GateStation" => ""
2486     ),
2487     "uri" => ""
2488     ),
2489     "hatena" => array(
2490     "icon" => "hatena",
2491     "title" => "Hatena",
2492     "rule" => array(
2493     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2494     ),
2495     "uri" => ""
2496     ),
2497     "htmlparser" => array(
2498     "icon" => "htmlparser",
2499     "title" => "HTMLParser",
2500     "rule" => array(
2501     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2502     ),
2503     "uri" => "http://htmlparser.sourceforge.net/"
2504     ),
2505     "helix" => array( // Helix crawler (sitesearch.ca); distinct from the "heritrix" entry that follows
2506     "icon" => "helix",
2507     "title" => "Helix", // was "Heritrix", duplicating the title of the next entry
2508     "rule" => array(
2509     "^helix[ /]([0-9.]{1,10})" => "\\1"
2510     ),
2511     "uri" => "http://www.sitesearch.ca/helix/"
2512     ),
2513     "heritrix" => array(
2514     "icon" => "heritrix",
2515     "title" => "Heritrix",
2516     "rule" => array(
2517     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2518     "archive.org_bot" => "",
2519     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2520     ),
2521     "uri" => "http://archive.org"
2522     ),
2523     "hiddenmarket" => array(
2524     "icon" => "robot",
2525     "title" => "HiddenMarket",
2526     "rule" => array(
2527     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2528     ),
2529     "uri" => ""
2530     ),
2531     "honda" => array(
2532     "icon" => "robot",
2533     "title" => "Honda",
2534     "rule" => array(
2535     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2536     ),
2537     "uri" => "http://www.honda-search.com"
2538     ),
2539     "hoowwwer" => array(
2540     "icon" => "hoowwwer",
2541     "title" => "HooWWWer",
2542     "rule" => array(
2543     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2544     ),
2545     "uri" => ""
2546     ),
2547     "hotzonu" => array(
2548     "icon" => "hotzonu",
2549     "title" => "Hotzonu",
2550     "rule" => array(
2551     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2552     ),
2553     "uri" => ""
2554     ),
2555     "houxou" => array(
2556     "icon" => "robot",
2557     "title" => "Houxou",
2558     "rule" => array(
2559     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2560     "HouxouCrawler" => ""
2561     ),
2562     "uri" => ""
2563     ),
2564     "htdig" => array( // ht://Dig: versioned rule first, then a version-less fallback
2565     "icon" => "htdig",
2566     "title" => "ht://Dig",
2567     "rule" => array(
2568     "htdig[ /]([0-9.]{1,10})" => "\\1",
2569     "htdig" => "" // fallback has no capture group, so there is nothing for "\\1" to reference
2570     ),
2571     "uri" => ""
2572     ),
2573     "html2jpg" => array(
2574     "icon" => "html2jpg",
2575     "title" => "HTML2JPG",
2576     "rule" => array(
2577     "^HTML2JPG" => ""
2578     ),
2579     "uri" => ""
2580     ),
2581     "httperf" => array(
2582     "icon" => "robot",
2583     "title" => "HTTPerf",
2584     "rule" => array(
2585     "httperf[ /]([0-9.]{1,10})" => "\\1"
2586     ),
2587     "uri" => ""
2588     ),
2589     "httpunit" => array(
2590     "icon" => "httpunit",
2591     "title" => "HttpUnit",
2592     "rule" => array(
2593     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2594     ),
2595     "uri" => ""
2596     ),
2597     "httrack" => array(
2598     "icon" => "httrack",
2599     "title" => "HTTrack",
2600     "rule" => array(
2601     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2602     ),
2603     "uri" => ""
2604     ),
2605     "huaweisymantec" => array(
2606     "icon" => "huaweisymantec",
2607     "title" => "HuaweiSymantec",
2608     "rule" => array(
2609     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2610     ),
2611     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2612     ),
2613     "hungary" => array(
2614     "icon" => "hungary",
2615     "title" => "Hungary",
2616     "rule" => array(
2617     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2618     ),
2619     "uri" => ""
2620     ),
2621 joku 261 "i18n" => array(
2622     "icon" => "w3c",
2623     "title" => "W3C I18n Checker",
2624     "rule" => array(
2625     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2626 joku 169 ),
2627 joku 261 "uri" => "http://validator.w3.org/services"
2628     ),
2629 joku 63 "iakke" => array(
2630     "icon" => "iakke",
2631 matthys 209 "title" => "Iakké",
2632 joku 63 "rule" => array(
2633     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2634     ),
2635     "uri" => "http://fr.iakke.com/"
2636     ),
2637     "iask" => array(
2638     "icon" => "iask",
2639     "title" => "IAsk",
2640     "rule" => array(
2641     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2642     "^iaskspider" => ""
2643     ),
2644     "uri" => "http://iask.com"
2645     ),
2646     "icc" => array(
2647     "icon" => "icc",
2648     "title" => "ICC-Crawler",
2649     "rule" => array(
2650     "^ICC-Crawler" => ""
2651     ),
2652     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2653     ),
2654     "icerocket" => array(
2655     "icon" => "icerocket",
2656     "title" => "Icerocket",
2657     "rule" => array(
2658     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2659     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2660     ),
2661     "uri" => ""
2662     ),
2663     "icjobs" => array(
2664     "icon" => "icjobs",
2665     "title" => "iCjobs",
2666     "rule" => array(
2667     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2668     ),
2669     "uri" => "http://www.icjobs.de/"
2670     ),
2671     "icra" => array(
2672     "icon" => "icra",
2673     "title" => "ICRA",
2674     "rule" => array(
2675     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2676     ),
2677     "uri" => "http://www.icra.org"
2678     ),
2679     "iknow" => array(
2680     "icon" => "robot",
2681     "title" => "I know",
2682     "rule" => array(
2683     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2684     ),
2685     "uri" => ""
2686     ),
2687     "ilial" => array(
2688     "icon" => "robot",
2689     "title" => "Ilial",
2690     "rule" => array(
2691     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2692     ),
2693     "uri" => ""
2694     ),
2695     "ilocal" => array(
2696     "icon" => "ilocal",
2697     "title" => "ilocal",
2698     "rule" => array(
2699     "^ilocal" => "",
2700     ),
2701     "uri" => "http://www.ilocal.nl"
2702     ),
2703     "ilse" => array( // Ilse: matches INGRID, IlseRobot and IlseBot user agents
2704     "icon" => "ilse",
2705     "title" => "Ilse",
2706     "rule" => array(
2707     "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot-name alternation; the version is group 2
2708     ),
2709     "uri" => "http://ilse.nl/"
2710     ),
2711     "iltrovatore" => array(
2712     "icon" => "iltrovatore",
2713     "title" => "IlTrovatore",
2714     "rule" => array(
2715     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2716     "Iltrovatore-Setaccio" => "",
2717     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2718     ),
2719     "uri" => ""
2720     ),
2721     "indylibrary" => array(
2722     "icon" => "robot",
2723     "title" => "Indy Library",
2724     "rule" => array(
2725     "Indy[ \-]?Library" => ""
2726     ),
2727     "uri" => ""
2728     ),
2729     "inela" => array( // Inela: matches "InelaBot" followed by a version
2730     "icon" => "robot",
2731     "title" => "Inela",
2732     "rule" => array(
2733     "InelaBot[ /]([0-9.]{1,10})" => "\\1" // report the captured version, as sibling entries do (was "")
2734     ),
2735     "uri" => "http://inelegant.org/bot"
2736     ),
2737     "ineturl" => array( // InetURL: matches "InetURL", one optional character, then a version
2738     "icon" => "robot",
2739     "title" => "InetURL",
2740     "rule" => array(
2741     "InetURL.?[ /]([0-9.]{1,10})" => "\\1" // report the captured version, as sibling entries do (was "")
2742     ),
2743     "uri" => ""
2744     ),
2745     "infoart" => array(
2746     "icon" => "robot",
2747     "title" => "InfoArt",
2748     "rule" => array(
2749     "InfoArt crawler" => ""
2750     ),
2751     "uri" => ""
2752     ),
2753     "infomine" => array(
2754     "icon" => "infomine",
2755     "title" => "INFOMINE",
2756     "rule" => array(
2757     "^DataFountains/DMOZ" => "",
2758     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2759     ),
2760     "uri" => "http://infomine.ucr.edu/"
2761     ),
2762     "infoseek" => array(
2763     "icon" => "infoseek",
2764     "title" => "Infoseek",
2765     "rule" => array(
2766     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2767     "Infoseek" => ""
2768     ),
2769     "uri" => ""
2770     ),
2771     "inktomi" => array(
2772     "icon" => "inktomi",
2773     "title" => "Inktomi",
2774     "rule" => array(
2775     "slurp@inktomi\.com" => ""
2776     ),
2777     "uri" => ""
2778     ),
2779     "innerprise" => array(
2780     "icon" => "robot",
2781     "title" => "Innerprise",
2782     "rule" => array(
2783     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2784     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2785     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2786     ),
2787     "uri" => "http://www.innerprise.com/"
2788     ),
2789     "inria" => array(
2790     "icon" => "inria",
2791     "title" => "Inria",
2792     "rule" => array(
2793     "^xyro_" => ""
2794     ),
2795     "uri" => ""
2796     ),
2797     "insitor" => array(
2798     "icon" => "insitor",
2799     "title" => "Insitor",
2800     "rule" => array(
2801     "^Insitor(,|\.|naut)" => ""
2802     ),
2803     "uri" => "http://www.insitor.com/"
2804     ),
2805     "internetninja" => array(
2806     "icon" => "robot",
2807     "title" => "Internet Ninja",
2808     "rule" => array(
2809     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2810     ),
2811     "uri" => ""
2812     ),
2813     "internetseer" => array(
2814     "icon" => "internetseer",
2815     "title" => "InternetSeer",
2816     "rule" => array(
2817     "^InternetSeer\.com" => ""
2818     ),
2819     "uri" => ""
2820     ),
2821     "interseek" => array(
2822     "icon" => "interseek",
2823     "title" => "Interseek",
2824     "rule" => array(
2825     "Interseek.com" => ""
2826     ),
2827     "uri" => "http://www.interseek.com"
2828     ),
2829     "intravnews" => array(
2830     "icon" => "intravnews",
2831     "title" => "IntraVnews",
2832     "rule" => array(
2833     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2834     ),
2835     "uri" => "http://www.intravnews.com/"
2836     ),
2837     "ip2location" => array(
2838     "icon" => "ip2location",
2839     "title" => "IP2LocationBot",
2840     "rule" => array(
2841     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2842     ),
2843     "uri" => "http://www.ip2location.com"
2844     ),
2845     "ipworks" => array(
2846     "icon" => "ipworks",
2847     "title" => "IP*Works",
2848     "rule" => array(
2849     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2850     ),
2851     "uri" => "http://www.nsoftware.com/ipworks/"
2852     ),
2853     "irca" => array( // NOTE(review): key, first rule and uri point at ICRA, but the title names Novell iChain - confirm intent
2854     "icon" => "robot",
2855     "title" => "Novell iChain Cool Solutions caching",
2856     "rule" => array(
2857 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2", // group 1 = agent name, group 2 = version; NOTE(review): "ICRA_Semantic_spider" is also matched by the earlier "icra" entry - presumably the first matching entry wins, verify
2858     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1" // Mozilla-compatible agent containing "ICS"; group 1 is the Mozilla version number
2859 joku 63 ),
2860     "uri" => "http://www.icra.org"
2861     ),
2862     "irvine" => array(
2863     "icon" => "robot",
2864     "title" => "Irvine",
2865     "rule" => array(
2866     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2867     ),
2868     "uri" => ""
2869     ),
2870     "ips-agent" => array(
2871     "icon" => "robot",
2872 matthys 209 "title" => "IPS-agent",
2873 joku 63 "rule" => array(
2874     "ips-agent" => ""
2875     ),
2876     "uri" => ""
2877     ),
2878     "isara" => array(
2879     "icon" => "isara",
2880 matthys 209 "title" => "Isara",
2881 joku 63 "rule" => array(
2882     "Isara[ -]([0-9.]{1,10})" => "\\1"
2883     ),
2884     "uri" => "http://www.isara.org/"
2885     ),
2886     "isspider" => array(
2887     "icon" => "robot",
2888     "title" => "ISSpider",
2889     "rule" => array(
2890     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2891     ),
2892     "uri" => ""
2893     ),
2894     "it2media" => array(
2895     "icon" => "it2media",
2896     "title" => "IT2media",
2897     "rule" => array(
2898     "www.adressendeutschland.de" => ""
2899     ),
2900     "uri" => "http://www.adressendeutschland.de/"
2901     ),
2902     "ivia" => array(
2903     "icon" => "robot",
2904     "title" => "iVia",
2905     "rule" => array(
2906     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2907     ),
2908     "uri" => ""
2909     ),
2910     "jeteye" => array(
2911     "icon" => "jeteye",
2912     "title" => "Jeteye",
2913     "rule" => array(
2914     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2915     ),
2916     "uri" => ""
2917     ),
2918     "jobsde" => array(
2919     "icon" => "jobsde",
2920     "title" => "jobs.de",
2921     "rule" => array(
2922     "www\.jobs\.de" => "",
2923     "jobs.de-Robot" => ""
2924     ),
2925     "uri" => "http://www.jobs.de/"
2926     ),
2927     "jpluck" => array(
2928     "icon" => "robot",
2929     "title" => "Jpluck",
2930     "rule" => array(
2931     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2932     ),
2933     "uri" => ""
2934     ),
2935     "jxta" => array(
2936     "icon" => "robot",
2937     "title" => "Jxta",
2938     "rule" => array(
2939     "falcon[ /]([0-9.]{1,10})" => "\\1"
2940     ),
2941     "uri" => ""
2942     ),
2943     "jyte" => array(
2944     "icon" => "jyte",
2945     "title" => "Jyte",
2946     "rule" => array(
2947     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2948     ),
2949     "uri" => ""
2950     ),
2951     "jyxo" => array(
2952     "icon" => "jyxo",
2953     "title" => "Jyxo",
2954     "rule" => array(
2955     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2956     ),
2957     "uri" => ""
2958     ),
2959     "kalooga" => array(
2960     "icon" => "kalooga",
2961     "title" => "Kalooga",
2962     "rule" => array(
2963     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2964     "^kalooga" => "",
2965     "KaloogaBot" => ""
2966     ),
2967     "uri" => "http://www.kalooga.com"
2968     ),
2969     "keywen" => array(
2970     "icon" => "keywen",
2971     "title" => "Keywen",
2972     "rule" => array(
2973     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
2974     ),
2975     "uri" => ""
2976     ),
2977     "kilomonkey" => array(
2978     "icon" => "robot",
2979     "title" => "Kilomonkey",
2980     "rule" => array(
2981     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
2982     ),
2983     "uri" => "http://www.kilomonkey.com/notabot.txt"
2984     ),
2985     "kinja" => array(
2986     "icon" => "kinja",
2987     "title" => "Kinja",
2988     "rule" => array(
2989     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
2990     "^kinjabot" => ""
2991     ),
2992     "uri" => ""
2993     ),
2994     "kiwi" => array(
2995     "icon" => "robot",
2996     "title" => "KiwiStatus",
2997     "rule" => array(
2998     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
2999     "KiwiStatus" => ""
3000     ),
3001     "uri" => "http://www.nzs.com/kiei-status/"
3002     ),
3003     "lachesis" => array(
3004     "icon" => "robot",
3005     "title" => "Lachesis",
3006     "rule" => array(
3007     "lachesis" => ""
3008     ),
3009     "uri" => ""
3010     ),
3011     "lanshan" => array( // Lanshan: matches "lanshanbot" followed by a version
3012     "icon" => "robot",
3013     "title" => "Lanshan", // was "Lachesis", apparently copied from the preceding entry
3014     "rule" => array(
3015     "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
3016     ),
3017     "uri" => ""
3018     ),
3019     "lapozz" => array(
3020     "icon" => "lapozz",
3021     "title" => "Lapozz",
3022     "rule" => array(
3023     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3024     ),
3025     "uri" => ""
3026     ),
3027     "larbin" => array(
3028     "icon" => "robot",
3029     "title" => "Larbin",
3030     "rule" => array(
3031     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3032     ),
3033     "uri" => ""
3034     ),
3035     "laurion" => array(
3036     "icon" => "robot",
3037     "title" => "Laurion",
3038     "rule" => array(
3039     "^IPiumBot" => ""
3040     ),
3041     "uri" => "http://www.laurion.com/"
3042     ),
3043     "leechget" => array(
3044     "icon" => "leechget",
3045     "title" => "LeechGet",
3046     "rule" => array(
3047     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3048     ),
3049     "uri" => ""
3050     ),
3051     "linguaseek" => array(
3052     "icon" => "linguaseek",
3053     "title" => "Linguaseek",
3054     "rule" => array(
3055     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3056     ),
3057     "uri" => "http://www.linguaseek.com/"
3058     ),
3059     "linguee" => array(
3060     "icon" => "linguee",
3061     "title" => "Linguee",
3062     "rule" => array(
3063     "^Linguee Bot" => ""
3064     ),
3065     "uri" => "http://www.linguee.com/"
3066     ),
3067 matthys 355 "linkapedia" => array(
3068     "icon" => "linkapedia",
3069     "title" => "Linkapedia",
3070     "rule" => array(
3071     "^linkapedia" => ""
3072     ),
3073     "uri" => "http://www.linkapedia.com"
3074     ),
3075 matthys 346 "linkdex" => array(
3076     "icon" => "linkdex",
3077     "title" => "Linkdex",
3078     "rule" => array(
3079     "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3080     ),
3081     "uri" => "http://www.linkdex.com/bots/"
3082     ),
3083 matthys 366 "linkedin" => array(
3084     "icon" => "linkedin",
3085     "title" => "LinkedIn",
3086     "rule" => array(
3087     "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3088     ),
3089     "uri" => "http://www.linkedin.com"
3090     ),
3091 joku 63 "linkguard" => array(
3092     "icon" => "robot",
3093     "title" => "Linkguard",
3094     "rule" => array(
3095     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3096     ),
3097     "uri" => "http://www.linkguard.com/"
3098     ),
3099     "linklint" => array(
3100     "icon" => "linklint",
3101     "title" => "Linklint",
3102     "rule" => array(
3103     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3104     ),
3105     "uri" => "http://www.linklint.org/"
3106     ),
3107     "linkman" => array(
3108     "icon" => "linkman",
3109     "title" => "Linkman",
3110     "rule" => array(
3111     "\(compatible; Linkman\)" => ""
3112     ),
3113     "uri" => ""
3114     ),
3115     // Needs to be before linkcheck for correct detection
3116     "linkchecker" => array(
3117     "icon" => "w3c",
3118     "title" => "W3C Link Checker",
3119     "rule" => array(
3120     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3121     ),
3122     "uri" => "http://validator.w3.org/checklink"
3123     ),
3124     "linkcheck" => array(
3125     "icon" => "linkcheck",
3126     "title" => "Linkcheck",
3127     "rule" => array(
3128     "checklink[ /]([0-9.]{1,10})" => "\\1",
3129     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3130     "Adaxas Spider" => "",
3131     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3132     "NetMechanic V([0-9.]{1,10})" => "\\1",
3133     "^InfoLink" => "",
3134     "InternetLinkAgent" => "",
3135     "; SPENG\)" => "",
3136     "SharewarePlazaFileCheckBot" => "",
3137     "fileboost.net" => "",
3138     "^billbot" => ""
3139     ),
3140     "uri" => ""
3141     ),
3142     "linkru" => array(
3143     "icon" => "robot",
3144     "title" => "Link.RU",
3145     "rule" => array(
3146     "^Link.RU bot" => ""
3147     ),
3148     "uri" => ""
3149     ),
3150     "linkssql" => array(
3151     "icon" => "robot",
3152     "title" => "Links SQL",
3153     "rule" => array(
3154     "links sql" => ""
3155     ),
3156     "uri" => ""
3157     ),
3158     "linksweeper" => array(
3159     "icon" => "robot",
3160     "title" => "Link Sweeper",
3161     "rule" => array(
3162     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3163     ),
3164     "uri" => ""
3165     ),
3166     "linkwalker" => array(
3167     "icon" => "robot",
3168     "title" => "Link Walker",
3169     "rule" => array(
3170     "^LinkWalker" => ""
3171     ),
3172     "uri" => ""
3173     ),
3174     "lipperhey" => array(
3175     "icon" => "lipperhey",
3176     "title" => "Lipperhey",
3177     "rule" => array(
3178     "Lipperhey Spider" => ""
3179     ),
3180     "uri" => "http://www.lipperhey.com"
3181     ),
3182     "livedoor" => array(
3183     "icon" => "livedoor",
3184     "title" => "Livedoor",
3185     "rule" => array(
3186     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3187     ),
3188     "uri" => ""
3189     ),
3190     "livejournal" => array(
3191     "icon" => "livejournal",
3192     "title" => "Live Journal",
3193     "rule" => array(
3194     "^LiveJournal\.com" => ""
3195     ),
3196     "uri" => "http://www.livejournal.com"
3197     ),
3198     "ljpic" => array(
3199     "icon" => "ljpic",
3200     "title" => "ljpic",
3201     "rule" => array(
3202     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3203     ),
3204     "uri" => "http://www.ljpic.com"
3205     ),
3206     "lmspider" => array(
3207     "icon" => "robot",
3208     "title" => "Lmspider",
3209     "rule" => array(
3210     "^lmspider" => ""
3211     ),
3212     "uri" => ""
3213     ),
3214     "locators" => array(
3215     "icon" => "robot",
3216     "title" => "Locaters",
3217     "rule" => array(
3218     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3219     ),
3220     "uri" => ""
3221     ),
3222     "look" => array(
3223     "icon" => "look",
3224     "title" => "Look",
3225     "rule" => array(
3226     "www\.look\.com" => "",
3227     "Lookbot" => ""
3228     ),
3229     "uri" => ""
3230     ),
3231     "looksmart" => array(
3232     "icon" => "looksmart",
3233     "title" => "LookSmart",
3234     "rule" => array(
3235     "^Martini" => "",
3236     "^MantraAgent" => "",
3237     "FurlBot" => "",
3238     "looksmart-sv-fw" => ""
3239     ),
3240     "uri" => ""
3241     ),
3242     "loop" => array(
3243     "icon" => "loop",
3244     "title" => "LOOP",
3245     "rule" => array(
3246     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3247     ),
3248     "uri" => ""
3249     ),
3250     "lotkyll" => array(
3251     "icon" => "robot",
3252     "title" => "Lotkyll",
3253     "rule" => array(
3254     "Lotkyll" => ""
3255     ),
3256     "uri" => ""
3257     ),
3258 joku 335 "ltx71" => array(
3259     "icon" => "robot",
3260     "title" => "LTX71",
3261     "rule" => array(
3262     "ltx71" => ""
3263     ),
3264     "uri" => "http://ltx71.com/"
3265     ),
3266 joku 63 "lwp" => array(
3267     "icon" => "robot",
3268     "title" => "lwp",
3269     "rule" => array(
3270     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3271     ),
3272     "uri" => ""
3273     ),
3274     "lycos" => array(
3275     "icon" => "lycos",
3276     "title" => "Lycos",
3277     "rule" => array(
3278     "Lycos_Spider_" => ""
3279     ),
3280     "uri" => ""
3281     ),
3282     "magpierss" => array(
3283     "icon" => "rss",
3284     "title" => "MagpieRSS",
3285     "rule" => array(
3286     "MagpieRSS" => ""
3287     ),
3288     "uri" => "http://magpierss.sourceforge.net/"
3289     ),
3290     "mailru" => array(
3291     "icon" => "mailru",
3292 matthys 209 "title" => "Mail.Ru",
3293 joku 63 "rule" => array(
3294 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3295     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3296 joku 63 ),
3297 matthys 209 "uri" => "http://www.mail.ru/"
3298 joku 63 ),
3299     "mailsweeper" => array(
3300     "icon" => "robot",
3301     "title" => "Mail Sweeper",
3302     "rule" => array(
3303     "Mail[ \-]?Sweeper" => ""
3304     ),
3305     "uri" => ""
3306     ),
3307     "marvin" => array(
3308     "icon" => "robot",
3309     "title" => "Marvin",
3310     "rule" => array(
3311     "^Marvin" => ""
3312     ),
3313     "uri" => ""
3314     ),
3315     "matkurja" => array(
3316     "icon" => "matkurja",
3317     "title" => "Mat'Kurja",
3318     "rule" => array(
3319     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3320     ),
3321     "uri" => ""
3322     ),
3323     "mavicanet" => array(
3324     "icon" => "mavicanet",
3325     "title" => "Mavicanet",
3326     "rule" => array(
3327     "Mavicanet robot" => ""
3328     ),
3329     "uri" => ""
3330     ),
3331 matthys 292 "meanpath" => array(
3332     "icon" => "meanpath",
3333 matthys 290 "title" => "Meanpath",
3334 matthys 280 "rule" => array(
3335     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3336     ),
3337     "uri" => "http://www.meanpath.com/meanpathbot.html"
3338 matthys 275 ),
3339 matthys 280 "mediater" => array(
3340 joku 63 "icon" => "robot",
3341     "title" => "Mediater",
3342     "rule" => array (
3343     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3344 matthys 280 ),
3345     "uri" => ""
3346 joku 63 ),
3347 matthys 305 "memory" => array(
3348     "icon" => "memory",
3349     "title" => "internet Memory",
3350     "rule" => array (
3351     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3352     ),
3353     "uri" => "http://internetmemory.org/en/"
3354     ),
3355 joku 63 "mercator" => array(
3356     "icon" => "robot",
3357     "title" => "Mercator",
3358     "rule" => array(
3359     "Mercator" => ""
3360     ),
3361     "uri" => ""
3362     ),
3363     "metacarta" => array( // Metacarta: matched by contact address in the user agent, or by the "flunky" prefix
3364     "icon" => "robot",
3365     "title" => "Metacarta",
3366     "rule" => array(
3367     "^RRC \(crawler_admin@bigfoot\.com\)" => "", // parentheses escaped: unescaped they formed a group and never matched the literal "(...)"
3368     "^flunky" => "",
3369     "^Mozilla.*\(samualt9@bigfoot\.com\)$" => "" // dot escaped so it matches only a literal "."
3370     ),
3371     "uri" => "http://www.metacarta.com"
3372     ),
3373     "metager" => array(
3374     "icon" => "metager",
3375     "title" => "MetaGer",
3376     "rule" => array(
3377     "MetaGer" => ""
3378     ),
3379     "uri" => ""
3380     ),
3381     "metamark" => array(
3382     "icon" => "robot",
3383     "title" => "Metamark",
3384     "rule" => array(
3385     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3386     ),
3387     "uri" => "http://metamark.net"
3388     ),
3389     "metamedic" => array(
3390     "icon" => "metamedic",
3391     "title" => "MetaMedic",
3392     "rule" => array(
3393     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3394     ),
3395     "uri" => ""
3396     ),
3397     "mirago" => array(
3398     "icon" => "mirago",
3399     "title" => "Mirago",
3400     "rule" => array(
3401     "Mirago" => ""
3402     ),
3403     "uri" => ""
3404     ),
3405     "misterwong" => array(
3406     "icon" => "misterwong",
3407     "title" => "Mister Wong",
3408     "rule" => array(
3409     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3410     ),
3411     "uri" => "http://www.mister-wong.de/"
3412     ),
3413     "miva" => array(
3414     "icon" => "miva",
3415     "title" => "Miva",
3416     "rule" => array(
3417     "AlgoFeedback@miva\.com" => ""
3418     ),
3419     "uri" => "http://www.miva.com/"
3420     ),
3421     "mj12" => array(
3422     "icon" => "mj12",
3423     "title" => "Majestic-12",
3424     "rule" => array(
3425     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3426     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3427     ),
3428     "uri" => "http://majestic12.co.uk/bot.php"
3429     ),
3430     "mlbot" => array(
3431     "icon" => "robot",
3432     "title" => "MLBot",
3433     "rule" => array(
3434     "^MLBot" => ""
3435     ),
3436     "uri" => "http://www.metadatalabs.com/mlbot"
3437     ),
3438     "mnogo" => array(
3439     "icon" => "mnogo",
3440     "title" => "mnoGoSearch",
3441     "rule" => array(
3442     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3443     ),
3444     "uri" => "http://www.mnogosearch.org/"
3445     ),
3446     "mobileok" => array(
3447     "icon" => "mobileok",
3448     "title" => "W3C mobileOK",
3449     "rule" => array(
3450     "^W3C-mobileOK" => ""
3451     ),
3452     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3453     ),
3454 matthys 296 "mojeek" => array(
3455     "icon" => "mojeek",
3456     "title" => "Mojeek",
3457 joku 63 "rule" => array(
3458     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3459     ),
3460 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3461 joku 63 ),
3462     "momspider" => array(
3463     "icon" => "robot",
3464     "title" => "MOM Spider",
3465     "rule" => array(
3466     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3467     ),
3468     "uri" => ""
3469     ),
3470     "moreover" => array(
3471     "icon" => "moreover",
3472     "title" => "Moreover",
3473     "rule" => array(
3474     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3475     ),
3476     "uri" => ""
3477     ),
3478     "movabletype" => array(
3479     "icon" => "movabletype",
3480     "title" => "Movable Type",
3481     "rule" => array(
3482     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3483     ),
3484     "uri" => ""
3485     ),
3486     "mozdex" => array(
3487     "icon" => "mozdex",
3488     "title" => "MozDex",
3489     "rule" => array(
3490     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3491     ),
3492     "uri" => ""
3493     ),
3494     "mqbot" => array(
3495     "icon" => "robot",
3496     "title" => "MQbot",
3497     "rule" => array(
3498     "MQbot" => ""
3499     ),
3500     "uri" => ""
3501     ),
3502     "msnbot" => array(
3503     "icon" => "bing",
3504 matthys 205 "title" => "Bing",
3505 joku 63 "rule" => array(
3506     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3507     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3508     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3509     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3510     ),
3511     "uri" => ""
3512     ),
3513     "msnbot-mobile" => array(
3514     "icon" => "msn",
3515     "title" => "MSN Mobile",
3516     "rule" => array(
3517     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3518     "MSNBOT_Mobile" => "",
3519     "MSMOBOT" => ""
3520     ),
3521     "uri" => ""
3522     ),
3523     "mslivebot" => array(
3524     "icon" => "livesearch",
3525     "title" => "MS Live Search",
3526     "rule" => array(
3527     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3528     ),
3529     "uri" => ""
3530     ),
3531     "msproxy" => array(
3532     "icon" => "robot",
3533     "title" => "MSProxy",
3534     "rule" => array(
3535     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3536     ),
3537     "uri" => ""
3538     ),
3539     "msrbot" => array(
3540     "icon" => "robot",
3541     "title" => "MSRBOT",
3542     "rule" => array(
3543     "^MSRBOT" => ""
3544     ),
3545     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3546     ),
3547     "mswebdav" => array(
3548     "icon" => "robot",
3549     "title" => "MS-WebDAV",
3550     "rule" => array(
3551     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3552     ),
3553     "uri" => ""
3554     ),
3555     "mticon" => array(
3556     "icon" => "robot",
3557     "title" => "MTIcon",
3558     "rule" => array(
3559     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3560     ),
3561     "uri" => ""
3562     ),
3563     "multipage-validator" => array(
3564     "icon" => "multipage-validator",
3565     "title" => "Multipage Validator",
3566     "rule" => array(
3567     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3568     ),
3569     "uri" => "http://www.validator.ca/"
3570     ),
3571     "myrss" => array(
3572     "icon" => "rss",
3573     "title" => "MyRSS",
3574     "rule" => array(
3575     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3576     ),
3577     "uri" => ""
3578     ),
3579     "multimap" => array(
3580     "icon" => "robot",
3581     "title" => "Multimap",
3582     "rule" => array(
3583     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3584     ),
3585     "uri" => ""
3586     ),
3587     "najdi" => array(
3588     "icon" => "najdi",
3589     "title" => "Najdi.si",
3590     "rule" => array(
3591     "Najdi.si" => ""
3592     ),
3593     "uri" => "http://www.najdi.si"
3594     ),
3595     "nameprotect" => array(
3596     "icon" => "nameprotect",
3597     "title" => "Name Protect",
3598     "rule" => array(
3599     "NPBot" => ""
3600     ),
3601     "uri" => ""
3602     ),
3603     "nationaldirectory" => array(
3604     "icon" => "robot",
3605     "title" => "National Directory",
3606     "rule" => array(
3607     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3608     ),
3609     "uri" => ""
3610     ),
3611     "natsumican" => array(
3612     "icon" => "robot",
3613     "title" => "Natsu Mican",
3614     "rule" => array(
3615     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3616     ),
3617     "uri" => ""
3618     ),
3619     "naverbot" => array(
3620     "icon" => "naverbot",
3621     "title" => "Naver",
3622     "rule" => array(
3623     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3624     "Naver(Bot)?" => "",
3625     "^nabot" => ""
3626     ),
3627     "uri" => ""
3628     ),
3629     "navisso" => array(
3630     "icon" => "navisso",
3631     "title" => "Navisso",
3632     "rule" => array(
3633     "Navisso(Bot)?" => ""
3634     ),
3635     "uri" => "http://www.navisso.com"
3636     ),
3637     "neofonie" => array(
3638     "icon" => "robot",
3639 matthys 205 "title" => "Neofonie",
3640 joku 63 "rule" => array(
3641     "www.neofonie.de" => ""
3642     ),
3643     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3644     ),
3645     "neomo" => array(
3646     "icon" => "robot",
3647     "title" => "Neomo",
3648     "rule" => array(
3649     "Francis[ /]([0-9.]{1,10})" => "\\1"
3650     ),
3651     "uri" => ""
3652     ),
3653     "nessus" => array(
3654     "icon" => "nessus",
3655     "title" => "Nessus",
3656     "rule" => array(
3657     "Nessus\)$" => ""
3658     ),
3659     "uri" => ""
3660     ),
3661 matthys 279 "nerdybot" => array(
3662 matthys 280 "icon" => "robot",
3663     "title" => "NerdyBot",
3664     "rule" => array(
3665     "NerdyBot" => ""
3666     ),
3667     "uri" => "http://nerdybot.com/"
3668 matthys 279 ),
3669 joku 63 "nerdbynature" => array(
3670     "icon" => "nerdbynature",
3671     "title" => "NerdByNature",
3672     "rule" => array(
3673     "NerdByNature.Bot" => ""
3674     ),
3675     "uri" => "http://www.nerdbynature.net/bot"
3676     ),
3677     "netants" => array(
3678     "icon" => "netants",
3679     "title" => "NetAnts",
3680     "rule" => array(
3681     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3682     ),
3683     "uri" => ""
3684     ),
3685     "netcraft" => array(
3686     "icon" => "netcraft",
3687     "title" => "Netcraft",
3688     "rule" => array(
3689     "netcraft" => ""
3690     ),
3691     "uri" => ""
3692     ),
3693     "netinfo" => array(
3694     "icon" => "netinfo",
3695     "title" => "Netinfo",
3696     "rule" => array(
3697     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3698     ),
3699     "uri" => "http://netinfo.bg/"
3700     ),
3701     "netluchs" => array(
3702     "icon" => "netluchs",
3703     "title" => "Netluchs",
3704     "rule" => array(
3705     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3706     ),
3707     "uri" => "http://www.netluchs.de/"
3708     ),
3709     "netmechanic" => array(
3710     "icon" => "netmechanic",
3711     "title" => "NetMechanic",
3712     "rule" => array(
3713     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3714     ),
3715     "uri" => ""
3716     ),
3717     "netnose" => array(
3718     "icon" => "netnose",
3719     "title" => "NetNose",
3720     "rule" => array(
3721     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3722     ),
3723     "uri" => ""
3724     ),
3725     "netoskop" => array(
3726     "icon" => "robot",
3727     "title" => "Netoskop",
3728     "rule" => array(
3729     "netoskop" => ""
3730     ),
3731     "uri" => ""
3732     ),
3733     "netpromoter" => array(
3734     "icon" => "netpromoter",
3735     "title" => "NetPromoter",
3736     "rule" => array(
3737     "NetPromoter Spider" => ""
3738     ),
3739     "uri" => "http://www.net-promoter.com/"
3740     ),
// Netprospector: the single pattern is anchored with ^, so it only matches
// user agents that begin with "netprospector". No version is captured.
"netprospector" => array(
  "icon" => "robot",
  "title" => "Netprospector",
  "rule" => array(
    "^netprospector" => ""
  ),
  // Empty placeholder so this entry exposes the same four keys
  // (icon, title, rule, uri) as the other entries of $robot.
  "uri" => ""
),
3748     "netpumper" => array(
3749     "icon" => "robot",
3750     "title" => "Netpumper",
3751     "rule" => array(
3752     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3753     ),
3754     "uri" => ""
3755     ),
3756     "netscapeproxy" => array(
3757     "icon" => "netscape",
3758     "title" => "Netscape Proxy",
3759     "rule" => array(
3760     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3761     ),
3762     "uri" => ""
3763     ),
3764     "netspective" => array(
3765     "icon" => "robot",
3766     "title" => "NetSpective",
3767     "rule" => array(
3768     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3769     ),
3770     "uri" => ""
3771     ),
// Netvibes: matches user agents that begin with "Netvibes" (^ anchor).
"netvibes" => array(
  "icon" => "netvibes",
  // Title without the stray leading blank.
  "title" => "Netvibes",
  "rule" => array(
    // The pattern has no capture group, so a "\\1" back-reference has
    // nothing to refer to; use "" like the other group-less rules.
    "^Netvibes" => ""
  ),
  "uri" => ""
),
3780     "newsfire" => array(
3781     "icon" => "newsfire",
3782     "title" => "NewsFire",
3783     "rule" => array(
3784     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3785     ),
3786     "uri" => ""
3787     ),
3788     "newsgator" => array(
3789     "icon" => "newsgator",
3790     "title" => "NewsGator",
3791     "rule" => array(
3792     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3793     ),
3794     "uri" => ""
3795     ),
3796     "newzcrawler" => array(
3797     "icon" => "newzcrawler",
3798     "title" => "NewzCrawler",
3799     "rule" => array(
3800     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3801     ),
3802     "uri" => ""
3803     ),
// Nextopia: matches user agents that begin with "NextopiaBOT" and captures the
// dotted number that follows a later "v" or blank as group 1.
"nextopia" => array(
  // Generic icon: the NewzCrawler icon belongs to a different product.
  // NOTE(review): switch to a dedicated "nextopia" icon if one is shipped.
  "icon" => "robot",
  "title" => "Nextopia",
  "rule" => array(
    "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
3812     "ngsearch" => array(
3813     "icon" => "ngsearch",
3814     "title" => "NG Search",
3815     "rule" => array(
3816     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3817     ),
3818     "uri" => ""
3819     ),
3820     "nimble" => array(
3821     "icon" => "robot",
3822     "title" => "Nimble",
3823     "rule" => array(
3824     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3825     ),
3826     "uri" => ""
3827     ),
3828     "nmap" => array(
3829     "icon" => "nmap",
3830     "title" => "Nmap",
3831     "rule" => array(
3832     "Nmap Scripting Engine" => ""
3833     ),
3834     "uri" => "http://nmap.org/book/nse.html"
3835     ),
3836     "nusearch" => array(
3837     "icon" => "robot",
3838     "title" => "NuSearch",
3839     "rule" => array(
3840     "^nuSearch" => ""
3841     ),
3842     "uri" => "http://www.nusearch.com/"
3843     ),
3844     "noago" => array(
3845     "icon" => "noago",
3846     "title" => "Noago",
3847     "rule" => array(
3848     "Noago Spider" => ""
3849     ),
3850     "uri" => "http://www.noago.com/"
3851     ),
3852     "noviforum" => array(
3853     "icon" => "noviforum",
3854     "title" => "Noviforum",
3855     "rule" => array(
3856     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3857     ),
3858     "uri" => ""
3859     ),
3860     "noxtrum" => array(
3861     "icon" => "noxtrum",
3862     "title" => "noXtrum",
3863     "rule" => array(
3864     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3865     ),
3866     "uri" => ""
3867     ),
3868     "noyona" => array(
3869     "icon" => "robot",
3870     "title" => "Noyona",
3871     "rule" => array(
3872     "noyona.([0-9._]{1,10})" => "\\1"
3873     ),
3874     "uri" => "http://noyona.com/"
3875     ),
3876     "nsauditor" => array(
3877     "icon" => "nsauditor",
3878     "title" => "Nsauditor",
3879     "rule" => array(
3880     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3881     ),
3882     "uri" => "http://www.nsauditor.com/"
3883     ),
3884     "obidosbot" => array(
3885     "icon" => "robot",
3886     "title" => "Bookwatch",
3887     "rule" => array(
3888     "obidos[ \-]?bot" => ""
3889     ),
3890     "uri" => ""
3891     ),
3892     "objectssearch" => array(
3893     "icon" => "robot",
3894     "title" => "Objects Search",
3895     "rule" => array(
3896     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3897     ),
3898     "uri" => ""
3899     ),
3900     "obot" => array(
3901 matthys 297 "icon" => "ibm",
3902     "title" => "IBM (ONLY) Crawler",
3903 joku 63 "rule" => array(
3904 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3905 joku 63 ),
3906 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3907     // Previously from "ONLY Solutions GmbH" – that is what the "O" stands for
3908 joku 63 ),
3909     "ocawa" => array(
3910     "icon" => "ocawa",
3911     "title" => "Ocawa",
3912     "rule" => array(
3913     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3914     "Ocawa" => ""
3915     ),
3916     "uri" => "http://www.ocawa.com/"
3917     ),
3918     "octora" => array(
3919     "icon" => "octora",
3920     "title" => "Octora",
3921     "rule" => array(
3922     "^Octora (Beta)?" => ""
3923     ),
3924     "uri" => "http://www.octora.com/"
3925     ),
3926     "offlineexplorer" => array(
3927     "icon" => "robot",
3928     "title" => "OfflineExplorer",
3929     "rule" => array(
3930     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3931     ),
3932     "uri" => ""
3933     ),
3934     "omea" => array(
3935     "icon" => "omea",
3936     "title" => "Omea Reader",
3937     "rule" => array(
3938     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3939     ),
3940     "uri" => ""
3941     ),
3942     "onet" => array(
3943     "icon" => "onet",
3944     "title" => "Onet",
3945     "rule" => array(
3946     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3947     "Onet\.pl" => "",
3948     "inktomi.search.onet" => ""
3949     ),
3950     "uri" => "http://www.onet.pl"
3951     ),
3952     "online24" => array(
3953     "icon" => "robot",
3954 matthys 209 "title" => "Online24",
3955 joku 63 "rule" => array(
3956     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3957     ),
3958     "uri" => "http://www.online24.de"
3959     ),
3960     "onlinewebcheck" => array(
3961     "icon" => "csehtmlvalidator",
3962     "title" => "CSE HTML Validator",
3963     "rule" => array(
3964     "onlinewebcheck" => ""
3965     ),
3966     "uri" => "http://www.onlinewebcheck.com"
3967     ),
3968     "onsearch" => array(
3969     "icon" => "onsearch",
3970 matthys 209 "title" => "OnSearch",
3971 joku 63 "rule" => array(
3972     "^onCHECK-Robot" => ""
3973     ),
3974     "uri" => "http://www.onsearch.de"
3975     ),
3976     "onto" => array(
3977     "icon" => "robot",
3978     "title" => "OntoSpider",
3979     "rule" => array(
3980     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
3981     ),
3982     "uri" => "http://ontospider.i-n.info/"
3983     ),
3984     "openacoon" => array(
3985     "icon" => "robot",
3986     "title" => "OpenAcoon",
3987     "rule" => array(
3988     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
3989     ),
3990     "uri" => "http://www.openacoon.de/"
3991     ),
3992     "openfind" => array(
3993     "icon" => "openfind",
3994     "title" => "Openfind",
3995     "rule" => array(
3996     "openbot[ /]([0-9.]{1,10})" => "\\1",
3997     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
3998     ),
3999     "uri" => ""
4000     ),
4001     "opentagger" => array(
4002     "icon" => "robot",
4003     "title" => "OpenTagger",
4004     "rule" => array(
4005     "^OpenTaggerBot" => ""
4006     ),
4007     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4008     ),
4009     "opentext" => array(
4010     "icon" => "opentext",
4011     "title" => "OpenText",
4012     "rule" => array(
4013     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4014     ),
4015     "uri" => "http://www.opentext.net/"
4016     ),
4017     "openweb" => array(
4018     "icon" => "robot",
4019     "title" => "OpenWebSpider",
4020     "rule" => array(
4021     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4022     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4023     ),
4024     "uri" => "http://www.openwebspider.org"
4025     ),
4026     "openx" => array(
4027     "icon" => "openx",
4028     "title" => "OpenX Spider",
4029     "rule" => array(
4030     "OpenX" => ""
4031     ),
4032     "uri" => "http://www.openx.org"
4033     ),
4034     "orange" => array(
4035     "icon" => "orange",
4036     "title" => "Orange",
4037     "rule" => array(
4038 joku 338 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4039     "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4040 joku 63 ),
4041     "uri" => "http://orange.com/"
4042     ),
4043     "organica" => array(
4044     "icon" => "robot",
4045     "title" => "Organica",
4046     "rule" => array(
4047     "crawler@organica\.us" => ""
4048     ),
4049     "uri" => ""
4050     ),
4051     "outfox" => array(
4052     "icon" => "robot",
4053     "title" => "Outfox Melon",
4054     "rule" => array(
4055     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4056     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4057     ),
4058     "uri" => ""
4059     ),
4060     "overture" => array(
4061     "icon" => "overture",
4062     "title" => "Overture",
4063     "rule" => array(
4064     "Overture[ \-]?WebCrawler" => ""
4065     ),
4066     "uri" => ""
4067     ),
4068 joku 337 "owler" => array(
4069     "icon" => "robot",
4070     "title" => "Owler",
4071     "rule" => array(
4072     "Owler[ /]([0-9.]{1,10})" => "\\1",
4073     "Owler" => ""
4074     ),
4075     "uri" => ""
4076     ),
4077 joku 63 "page2rss" => array(
4078     "icon" => "page2rss",
4079     "title" => "Page2RSS",
4080     "rule" => array(
4081     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4082     ),
4083     "uri" => "http://page2rss.com"
4084     ),
4085     "pagebytes" => array(
4086     "icon" => "robot",
4087     "title" => "PageBites",
4088     "rule" => array(
4089     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4090     ),
4091     "uri" => ""
4092     ),
4093 matthys 282 "pagesinventory" => array(
4094     "icon" => "pagesinventory",
4095     "title" => "PagesInventory",
4096     "rule" => array(
4097     "^PagesInventory" => ""
4098     ),
4099     "uri" => "http://www.pagesinventory.com"
4100     ),
4101 joku 63 "pagesjaunes" => array(
4102     "icon" => "pagesjaunes",
4103     "title" => "Pages Jaunes",
4104     "rule" => array(
4105     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4106     ),
4107     "uri" => "http://www.pagesjaunes.fr/"
4108     ),
4109     "pagevalet" => array(
4110     "icon" => "wdg",
4111     "title" => "WDG Page Valet",
4112     "rule" => array(
4113     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4114     ),
4115     "uri" => "http://www.htmlhelp.com/tools/validator/"
4116     ),
4117     "panopeabot" => array(
4118     "icon" => "robot",
4119     "title" => "PanopeaBot",
4120     "rule" => array(
4121     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4122     ),
4123     "uri" => ""
4124     ),
4125     "parchmenthill" => array(
4126     "icon" => "robot",
4127     "title" => "Parchment Hill",
4128     "rule" => array(
4129     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4130     ),
4131     "uri" => "http://www.parchmenthill.com/search.htm"
4132     ),
// Panscient: matches any user agent containing "panscient.com" (the dot is an
// unescaped regex wildcard, so any single character is accepted there).
// The array key and icon name keep their historical spelling "pascient";
// presumably both are referenced elsewhere (stored data, icon file name).
"pascient" => array(
  "icon" => "pascient",
  // Display name spelled like the domain in the rule and the uri.
  "title" => "Panscient",
  "rule" => array(
    "panscient.com" => ""
  ),
  "uri" => "http://www.panscient.com/"
),
4141     "peerbot" => array(
4142     "icon" => "peerbot",
4143     "title" => "Peerbot",
4144     "rule" => array(
4145     "^PEERbot" => ""
4146     ),
4147     "uri" => ""
4148     ),
4149     "php" => array(
4150     "icon" => "php",
4151     "title" => "PHP",
4152     "rule" => array(
4153     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4154     ),
4155     "uri" => ""
4156     ),
4157     "phpcrawl" => array(
4158     "icon" => "robot",
4159     "title" => "PHPCrawl",
4160     "rule" => array(
4161     "^PHPCrawl" => ""
4162     ),
4163     "uri" => "http://phpcrawl.cuab.de/"
4164     ),
4165     "phpdig" => array(
4166     "icon" => "robot",
4167     "title" => "PhpDig",
4168     "rule" => array(
4169     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4170     ),
4171     "uri" => "http://www.finbot.com/"
4172     ),
4173     "phpversiontracker" => array(
4174     "icon" => "phpversiontracker",
4175     "title" => "PHP version tracker",
4176     "rule" => array(
4177     "^PHP version tracker" => ""
4178     ),
4179     "uri" => "http://www.nexen.net/phpversion/bot.php"
4180     ),
// PictureOfInternet: matches user agents beginning with "PictureOfInternet"
// followed by a blank or slash and a dotted number (capture group 1).
"pictureofinternet" => array(
  "icon" => "robot",
  "title" => "PictureOfInternet",
  "rule" => array(
    // Hand the captured number on via "\\1", as the sibling rules with the
    // same "name[ /](version)" shape do, instead of discarding it.
    "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4189     "pingdom" => array(
4190     "icon" => "pingdom",
4191     "title" => "Pingdom",
4192     "rule" => array(
4193     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4194     "^Pingdom" => ""
4195     ),
4196     "uri" => "http://www.pingdom.com/"
4197     ),
4198     "pinseri" => array(
4199     "icon" => "pinseri",
4200     "title" => "Pinseri",
4201     "rule" => array(
4202     "www\.pinseri\.com/bloglist" => ""
4203     ),
4204     "uri" => ""
4205     ),
// Plagger: matches "Plagger" followed by a blank or slash and a dotted
// number, which is captured as group 1.
"plagger" => array(
  "icon" => "plagger",
  "title" => "Plagger",
  "rule" => array(
    "Plagger[ /]([0-9.]{1,10})" => "\\1"
  ),
  // Project homepage, spelled like the product name ("plagger", not "plugger").
  "uri" => "http://plagger.org/"
),
4214     "planet" => array(
4215     "icon" => "planet",
4216     "title" => "Planet",
4217     "rule" => array(
4218     "Planet[ /]([0-9.]{1,10})" => "\\1"
4219     ),
4220     "uri" => ""
4221     ),
4222     "plantynet" => array(
4223     "icon" => "robot",
4224     "title" => "PlantyNet",
4225     "rule" => array(
4226     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4227     ),
4228     "uri" => ""
4229     ),
4230     "pluck" => array(
4231     "icon" => "pluck",
4232     "title" => "Pluck",
4233     "rule" => array(
4234     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4235     ),
4236     "uri" => ""
4237     ),
4238     "plsearch" => array(
4239     "icon" => "plsearch",
4240     "title" => "PlanetSearch",
4241     "rule" => array(
4242     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4243     ),
4244     "uri" => ""
4245     ),
4246     "poe" => array(
4247     "icon" => "robot",
4248     "title" => "POE-Component",
4249     "rule" => array(
4250     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4251     ),
4252     "uri" => ""
4253     ),
4254     "pogodak" => array(
4255     "icon" => "pogodak",
4256     "title" => "Pogodak",
4257     "rule" => array(
4258     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4259     ),
4260     "uri" => ""
4261     ),
4262     "poodle" => array(
4263     "icon" => "robot",
4264     "title" => "Poodle predictor",
4265     "rule" => array(
4266     "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\1",
4267     "P(oo|ooo)dle[ \-]?predictor" => ""
4268     ),
4269     "uri" => "http://www.gritechnologies.com/tools/spider.go"
4270     ),
4271     "pompos" => array(
4272     "icon" => "pompos",
4273     "title" => "Pompos",
4274     "rule" => array(
4275     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4276     ),
4277     "uri" => ""
4278     ),
4279     "popdex" => array(
4280     "icon" => "robot",
4281     "title" => "Popdexter",
4282     "rule" => array(
4283     "Popdexter" => ""
4284     ),
4285     "uri" => ""
4286     ),
4287     "postrank" => array(
4288     "icon" => "postrank",
4289     "title" => "PostRank",
4290     "rule" => array(
4291     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4292     ),
4293     "uri" => "http://www.postrank.com/"
4294     ),
4295     "powermarks" => array(
4296     "icon" => "robot",
4297     "title" => "Powermarks",
4298     "rule" => array(
4299     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4300     ),
4301     "uri" => ""
4302     ),
// Pinterest: matches "Pinterest" followed by a blank or slash and a dotted
// number, which is captured as group 1. The pattern is not anchored.
"pinterest" => array(
  "icon" => "pinterest",
  // Display name of this entry; "PROBE!" is the title of the separate
  // "probe" entry and must not be reused here.
  "title" => "Pinterest",
  "rule" => array(
    "Pinterest[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.pinterest.com/"
),
4311 matthys 366 "probe" => array(
4312     "icon" => "robot",
4313     "title" => "PROBE!",
4314     "rule" => array(
4315     "^PROBE!" => ""
4316     ),
4317     "uri" => ""
4318     ),
4319 joku 63 "projecthoneypot" => array(
4320     "icon" => "projecthoneypot",
4321     "title" => "Project Honeypot",
4322     "rule" => array(
4323     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4324     "projecthoneypot" => ""
4325     ),
4326     "uri" => "http://www.projecthoneypot.org"
4327     ),
4328     "proxycache" => array(
4329     "icon" => "robot",
4330     "title" => "Proxy Cache",
4331     "rule" => array(
4332     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4333     ),
4334     "uri" => ""
4335     ),
4336     "proxyhunter" => array(
4337     "icon" => "robot",
4338     "title" => "ProxyHunter",
4339     "rule" => array(
4340     "ProxyHunter" => ""
4341     ),
4342     "uri" => ""
4343     ),
4344     "psbot" => array(
4345     "icon" => "picsearch",
4346     "title" => "PicSearch",
4347     "rule" => array(
4348     "^psbot" => ""
4349     ),
4350     "uri" => ""
4351     ),
4352     "pubsub" => array(
4353     "icon" => "pubsub",
4354     "title" => "PubSub",
4355     "rule" => array(
4356     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4357     "^PubSub\.com" => ""
4358     ),
4359     "uri" => ""
4360     ),
4361 joku 330 "pubarch" => array(
4362 joku 334 "icon" => "robot",
4363 joku 330 "title" => "PubArchive",
4364     "rule" => array(
4365     "publiclibraryarchive.org" => ""
4366     ),
4367     "uri" => ""
4368     ),
4369 joku 63 "pukiwiki" => array(
4370     "icon" => "pukiwiki",
4371     "title" => "PukiWiki",
4372     "rule" => array(
4373     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4374     ),
4375     "uri" => ""
4376     ),
4377     "pwebotxy" => array(
4378     "icon" => "pwebotxy",
4379     "title" => "PWeBot/X.Y",
4380     "rule" => array(
4381     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4382     ),
4383     "uri" => "http://www.programacionweb.net/robot.php"
4384     ),
4385     "pxys" => array(
4386     "icon" => "robot",
4387     "title" => "PXYS",
4388     "rule" => array(
4389     "^pxys" => ""
4390     ),
4391     "uri" => ""
4392     ),
// Qango: matches user agents beginning with "Qango", any one character, then
// "com" (the dot in the pattern is an unescaped regex wildcard).
"qango" => array(
  "icon" => "qango",
  "title" => "Qango",
  "rule" => array(
    "^Qango.com" => ""
  ),
  // Spelled like the name in the rule and title ("qango", not "quango").
  // NOTE(review): confirm the domain against the crawler's own user agent.
  "uri" => "http://www.qango.com/"
),
4401     "qihoo" => array(
4402     "icon" => "qihoo",
4403     "title" => "Qihoo",
4404     "rule" => array(
4405     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4406     ),
4407     "uri" => "http://www.qihoo.com/"
4408     ),
4409     "qseero" => array(
4410     "icon" => "robot",
4411     "title" => "Qseero",
4412     "rule" => array(
4413     "Qseero v([0-9.]{1,10})" => "\\1"
4414     ),
4415     "uri" => "http://www.q0.com/"
4416     ),
4417     "quantcast" => array(
4418     "icon" => "robot",
4419     "title" => "Quantcast",
4420     "rule" => array(
4421     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4422     ),
4423     "uri" => "http://www.quantcast.com/"
4424     ),
4425     "quepasa" => array(
4426     "icon" => "quepasa",
4427     "title" => "Quepasa",
4428     "rule" => array(
4429     "Quepasa[ \-]?Creep" => ""
4430     ),
4431     "uri" => ""
4432     ),
4433     "questfinder" => array(
4434     "icon" => "robot",
4435     "title" => "QuestFinder",
4436     "rule" => array(
4437     "www\.questfinder\.com" => ""
4438     ),
4439     "uri" => ""
4440     ),
4441 matthys 351 "qwantify" => array(
4442     "icon" => "qwantify",
4443     "title" => "Qwantify",
4444     "rule" => array(
4445     "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4446     ),
4447     "uri" => "https://www.qwant.com/"
4448     ),
4449 joku 63 "qweery" => array(
4450     "icon" => "robot",
4451     "title" => "Qweery",
4452     "rule" => array(
4453     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4454     ),
4455     "uri" => "http://qweerybot.qweery.nl"
4456     ),
// RacaiCrawler: matches "RacaiCrawler" followed by a blank or hyphen and a
// dotted number, which is captured as group 1.
"racaicrawler" => array(
  "icon" => "robot",
  "title" => "RacaiCrawler",
  "rule" => array(
    "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
  ),
  // Empty placeholder so this entry exposes the same four keys
  // (icon, title, rule, uri) as the other entries of $robot.
  "uri" => ""
),
4464     "radian6" => array(
4465     "icon" => "robot",
4466     "title" => "Radian6",
4467     "rule" => array(
4468     "www\.radian6\.com" => ""
4469     ),
4470     "uri" => "http://www.radian6.com"
4471     ),
4472     "rambler" => array(
4473     "icon" => "rambler",
4474     "title" => "Rambler",
4475     "rule" => array(
4476     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4477     ),
4478     "uri" => ""
4479     ),
// Ramiba: matches user agents beginning with "ramiba", optionally followed
// by "-bot".
"ramiba" => array(
  "icon" => "robot",
  "title" => "Ramiba",
  "rule" => array(
    // Group 1 is only the optional "-bot" suffix, not a version number, so
    // it is not passed on; "" is what the other version-less rules use.
    "^ramiba(-bot)?" => ""
  ),
  "uri" => ""
),
4488     "rankur" => array(
4489     "icon" => "rankur",
4490     "title" => "Rankur",
4491     "rule" => array(
4492     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4493     ),
4494     "uri" => "http://rankur.com/",
4495     ),
4496 joku 261 "red" => array(
4497     "icon" => "red",
4498     "title" => "RED",
4499     "rule" => array(
4500     "RED[ /]([0-9.]{1,10})" => "\\1"
4501     ),
4502     "uri" => "http://redbot.org/"
4503 joku 181 ),
4504 joku 63 "rediff" => array(
4505     "icon" => "rediff",
4506 matthys 209 "title" => "Rediff",
4507 joku 63 "rule" => array(
4508     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4509     ),
4510     "uri" => "http://www.rediff.com",
4511     ),
4512     "repia" => array(
4513     "icon" => "robot",
4514     "title" => "Repia",
4515     "rule" => array(
4516     "webmaster@repia\.com" => ""
4517     ),
4518     "uri" => ""
4519     ),
4520     "robotgenius" => array(
4521     "icon" => "robot",
4522     "title" => "Robot Genius",
4523     "rule" => array(
4524     "^robotgenius" => ""
4525     ),
4526     "uri" => "http://robotgenius.net",
4527     ),
4528     "robozilla" => array(
4529     "icon" => "robot",
4530     "title" => "Robozilla",
4531     "rule" => array(
4532     "Robozilla" => ""
4533     ),
4534     "uri" => ""
4535     ),
4536 matthys 302 "rogerbot" => array(
4537 matthys 306 "icon" => "moz",
4538     "title" => "Moz Rogerbot",
4539 matthys 302 "rule" => array(
4540     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4541     ),
4542     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4543     ),
4544 joku 63 "rojo" => array(
4545     "icon" => "rojo",
4546     "title" => "Rojo",
4547     "rule" => array(
4548     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4549     ),
4550     "uri" => ""
4551     ),
4552     "rss-atom" => array(
4553     "icon" => "rss",
4554     "title" => "RSS / Atom",
4555     "rule" => array(
4556     "^Apple-PubSub" => "",
4557     "^AppleSyndication" => ""
4558     ),
4559     "uri" => ""
4560     ),
4561     "rssbot" => array(
4562     "icon" => "rss",
4563 matthys 209 "title" => "RSS-bot",
4564 joku 63 "rule" => array(
4565     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4566     ),
4567     "uri" => ""
4568     ),
4569     "rssbandit" => array(
4570     "icon" => "rssbandit",
4571     "title" => "RssBandit",
4572     "rule" => array(
4573     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4574     ),
4575     "uri" => ""
4576     ),
4577     "rssimages" => array(
4578     "icon" => "rss",
4579 matthys 209 "title" => "RssImages",
4580 joku 63 "rule" => array(
4581     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4582     ),
4583     "uri" => ""
4584     ),
4585     "rssmicro" => array(
4586     "icon" => "rssmicro",
4587     "title" => "RSSMicro",
4588     "rule" => array(
4589     "RSSMicro\.com" => ""
4590     ),
4591     "uri" => "http://www.rssmicro.com"
4592     ),
4593     "rssowl" => array(
4594     "icon" => "rssowl",
4595     "title" => "RSSOwl",
4596     "rule" => array(
4597     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4598     ),
4599     "uri" => ""
4600     ),
// RssReader: matches "RssReader" followed by a blank or slash and a dotted
// number, which is captured as group 1.
"rssreader" => array(
  "icon" => "rss",
  "title" => "RssReader",
  "rule" => array(
    // Hand the captured number on via "\\1", as the sibling RSS reader
    // rules (RssBandit, RSSOwl, ...) do, instead of discarding it.
    "RssReader[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4609     "rtgi" => array(
4610     "icon" => "rtgi",
4611 matthys 209 "title" => "Rtgi",
4612 joku 63 "rule" => array(
4613     "RTGI" => ""
4614     ),
4615     "uri" => "http://rtgi.fr/"
4616     ),
4617     "rufusbot" => array(
4618     "icon" => "robot",
4619     "title" => "RufusBot",
4620     "rule" => array(
4621     "RufusBot" => ""
4622     ),
4623     "uri" => ""
4624     ),
4625 matthys 304 "runet" => array(
4626     "icon" => "runet",
4627     "title" => "iTrack RuNet Crawler",
4628     "rule" => array(
4629     "Runet-Research-Crawler" => ""
4630     ),
4631     "uri" => "http://www.itrack.ru/research/cmsrate/"
4632     ),
4633 joku 63 "runnk" => array(
4634     "icon" => "robot",
4635     "title" => "Runnk",
4636     "rule" => array(
4637     "Runnk RSS finder" => ""
4638     ),
4639     "uri" => "http://www.runnk.com/il/law"
4640     ),
4641     "sagool" => array(
4642     "icon" => "robot",
4643     "title" => "Sagool",
4644     "rule" => array(
4645     "MaSagool" => ""
4646     ),
4647     "uri" => "http://sagool.jp/"
4648     ),
4649     "sanszbot" => array(
4650     "icon" => "robot",
4651     "title" => "Sansz",
4652     "rule" => array(
4653     "SanszBot" => ""
4654     ),
4655     "uri" => ""
4656     ),
4657     "saucereader" => array(
4658     "icon" => "saucereader",
4659     "title" => "Sauce Reader",
4660     "rule" => array(
4661     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4662     ),
4663     "uri" => ""
4664     ),
4665     "sbider" => array(
4666     "icon" => "sbider",
4667     "title" => "SBIder",
4668     "rule" => array(
4669     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4670     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4671     ),
4672     "uri" => ""
4673     ),
4674     "scirus" => array(
4675     "icon" => "robot",
4676     "title" => "Scirus",
4677     "rule" => array(
4678     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4679     ),
4680     "uri" => ""
4681     ),
4682     "scoutjet" => array(
4683     "icon" => "scoutjet",
4684     "title" => "ScoutJet",
4685     "rule" => array(
4686     "ScoutJet" => ""
4687     ),
4688     "uri" => "http://www.scoutjet.com/"
4689     ),
4690 joku 261 "scrapy" => array(
4691     "icon" => "scrapy",
4692     "title" => "Scrapy",
4693     "rule" => array(
4694     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4695     ),
4696     "uri" => "http://scrapy.org"
4697     ),
4698 joku 63 "scrubby" => array(
4699     "icon" => "scrubby",
4700     "title" => "Scrubby",
4701     "rule" => array(
4702     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4703     ),
4704     "uri" => ""
4705     ),
4706     "sdm" => array(
4707     "icon" => "sdm",
4708     "title" => "SUN Download Manager",
4709     "rule" => array(
4710     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4711     ),
4712     "uri" => ""
4713     ),
4714     "sealinks" => array(
4715     "icon" => "robot",
4716     "title" => "Sea Links",
4717     "rule" => array(
4718     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4719     ),
4720     "uri" => ""
4721     ),
4722     "search17" => array(
4723     "icon" => "robot",
4724     "title" => "Search 17",
4725     "rule" => array(
4726     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4727     ),
4728     "uri" => "http://www.search17.com/bot.php"
4729     ),
4730     "search2" => array(
4731     "icon" => "search2",
4732     "title" => "Search2.net",
4733     "rule" => array(
4734     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4735     ),
4736     "uri" => "http://search2.net/"
4737     ),
4738     "searchbot" => array(
4739     "icon" => "robot",
4740     "title" => "Searchbot",
4741     "rule" => array(
4742     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4743     ),
4744     "uri" => ""
4745     ),
4746     "searchch" => array(
4747     "icon" => "robot",
4748     "title" => "Search.ch",
4749     "rule" => array(
4750     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4751     ),
4752     "uri" => ""
4753     ),
4754     "searchengineworld" => array(
4755     "icon" => "robot",
4756     "title" => "SearchEngineWorld",
4757     "rule" => array(
4758     "searchengineworld" => ""
4759     ),
4760     "uri" => "http://www.searchengineworld.com/"
4761     ),
4762     "searchhippo" => array(
4763     "icon" => "searchhippo",
4764     "title" => "Searchhippo",
4765     "rule" => array(
4766     "searchhippo" => ""
4767     ),
4768     "uri" => "http://www.searchhippo.com/"
4769     ),
4770     "searchthruus" => array(
4771     "icon" => "robot",
4772     "title" => "SearchThruUs",
4773     "rule" => array(
4774     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4775     ),
4776     "uri" => ""
4777     ),
4778     "securecomputing" => array(
4779     "icon" => "robot",
4780     "title" => "Secure Computing",
4781     "rule" => array(
4782     "securecomputing" => ""
4783     ),
4784     "uri" => ""
4785     ),
4786     "seekport" => array(
4787     "icon" => "seekport",
4788     "title" => "Seekport",
4789     "rule" => array(
4790     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4791     ),
4792     "uri" => ""
4793     ),
4794     "semanticdiscovery" => array(
4795     "icon" => "robot",
4796     "title" => "Semantic Discovery",
4797     "rule" => array(
4798     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4799     ),
4800     "uri" => ""
4801     ),
4802 matthys 319 "semrush" => array(
4803     "icon" => "semrush",
4804     "title" => "SEMrush",
4805     "rule" => array(
4806     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4807     ),
4808     "uri" => "http://www.semrush.com/bot.html"
4809     ),
4810 joku 63 "sengine" => array(
4811     "icon" => "sengine",
4812     "title" => "Sengine",
4813     "rule" => array(
4814     "netEstate NE Crawler" => ""
4815     ),
4816     "uri" => "http://www.sengine.info/"
4817     ),
4818     "sensis" => array(
4819     "icon" => "sensis",
4820     "title" => "Sensis",
4821     "rule" => array(
4822     "^Sensis(.com.au)? Web Crawler" => ""
4823     ),
4824     "uri" => "http://sensis.com.au"
4825     ),
4826     "seokicks" => array(
4827     "icon" => "seokicks",
4828     "title" => "SEOkicks",
4829     "rule" => array(
4830     "SEOkicks-Robot" => ""
4831     ),
4832     "uri" => "http://www.seokicks.de/"
4833     ),
4834     "seoprofiler" => array(
4835     "icon" => "seoprofiler",
4836     "title" => "SEOprofiler",
4837     "rule" => array(
4838     "spbot[ /]([0-9.]{1,10})" => "\\1"
4839     ),
4840     "uri" => "http://www.seoprofiler.com/"
4841     ),
4842     "setooz" => array(
4843     "icon" => "setooz",
4844     "title" => "Setooz",
4845     "rule" => array(
4846     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4847     ),
4848     "uri" => "http://www.setooz.com/oozbot.html"
4849     ),
4850     "seznam" => array(
4851     "icon" => "seznam",
4852     "title" => "Seznam",
4853     "rule" => array(
4854     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4855     "Seznam" => ""
4856     ),
4857     "uri" => "http://www.seznam.cz"
4858     ),
4859     "sharpreader" => array(
4860     "icon" => "sharpreader",
4861     "title" => "SharpReader",
4862     "rule" => array(
4863     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4864     ),
4865     "uri" => ""
4866     ),
4867     "shelob" => array(
4868     "icon" => "shelob",
4869     "title" => "Shelob", // was "Sherlock Spider", which is the title of the separate "sherlockspider" entry
4870     "rule" => array(
4871     "^Shelob" => ""
4872     ),
4873     "uri" => "http://www.gmx.net"
4874     ),
4875     "sherlockspider" => array(
4876     "icon" => "robot",
4877     "title" => "Sherlock Spider",
4878     "rule" => array(
4879     "sherlock_spider" => ""
4880     ),
4881     "uri" => ""
4882     ),
4883     "shim" => array(
4884     "icon" => "robot",
4885     "title" => "Shim Crawler",
4886     "rule" => array(
4887     "shim[ \-]crawler" => ""
4888     ),
4889     "uri" => ""
4890     ),
4891     "shopwiki" => array(
4892     "icon" => "shopwiki",
4893     "title" => "ShopWiki",
4894     "rule" => array(
4895     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4896     ),
4897     "uri" => ""
4898     ),
4899     "shoula" => array(
4900     "icon" => "robot",
4901     "title" => "Shoula",
4902     "rule" => array(
4903     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4904     ),
4905     "uri" => "http://www.shoula.com"
4906     ),
4907     "siege" => array(
4908     "icon" => "robot",
4909     "title" => "Siege",
4910     "rule" => array(
4911     "Siege[ /]([0-9.]{1,10})" => "\\1"
4912     ),
4913     "uri" => ""
4914     ),
4915     "siets" => array(
4916     "icon" => "robot",
4917     "title" => "Siets",
4918     "rule" => array(
4919     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4920     ),
4921     "uri" => ""
4922     ),
4923     "simpy" => array(
4924     "icon" => "simpy",
4925     "title" => "Simpy",
4926     "rule" => array(
4927     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4928     ),
4929     "uri" => ""
4930     ),
4931     "singingfish" => array(
4932     "icon" => "singingfish",
4933     "title" => "SingingFish",
4934     "rule" => array(
4935     "asterias[ /]([0-9.]{1,10})" => "\\1",
4936     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4937     "asterias" => ""
4938     ),
4939     "uri" => ""
4940     ),
4941     "sirketce" => array(
4942     "icon" => "robot",
4943     "title" => "Sirketce",
4944     "rule" => array(
4945     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4946     ),
4947     "uri" => "http://www.sirketce.com/bot.html"
4948     ),
4949     "sirobot" => array(
4950     "icon" => "robot",
4951     "title" => "SiroBot",
4952     "rule" => array(
4953     "sirobot" => ""
4954     ),
4955     "uri" => ""
4956     ),
4957     "sistrix" => array(
4958     "icon" => "sistrix",
4959     "title" => "SISTRIX",
4960     "rule" => array(
4961     "SISTRIX Crawler" => ""
4962     ),
4963     "uri" => "http://crawler.sistrix.net/"
4964     ),
4965     "sitebar" => array(
4966     "icon" => "sitebar",
4967     "title" => "SiteBar",
4968     "rule" => array(
4969     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
4970     ),
4971     "uri" => ""
4972     ),
4973     "sitebot" => array(
4974     "icon" => "sitebot",
4975     "title" => "SiteBot",
4976     "rule" => array(
4977     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
4978     ),
4979     "uri" => "http://www.sitebot.org/robot/"
4980     ),
4981 matthys 273 "siteexplorer" => array(
4982     "icon" => "siteexplorer",
4983     "title" => "SiteExplorer",
4984     "rule" => array(
4985     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
4986     ),
4987     "uri" => "http://siteexplorer.info/"
4988     ),
4989 joku 63 "sitesell" => array(
4990     "icon" => "sitesell",
4991     "title" => "SiteSell",
4992     "rule" => array(
4993     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
4994     ),
4995     "uri" => ""
4996     ),
4997     "sitespider" => array(
4998     "icon" => "robot",
4999     "title" => "SiteSpider",
5000     "rule" => array(
5001     "^SiteSpider" => ""
5002     ),
5003     "uri" => ""
5004     ),
5005     "sitesucker" => array(
5006     "icon" => "sitesucker",
5007     "title" => "SiteSucker",
5008     "rule" => array(
5009     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5010     ),
5011     "uri" => "http://www.sitesucker.us/"
5012     ),
5013     "sitidi" => array(
5014     "icon" => "robot",
5015     "title" => "SitiDi",
5016     "rule" => array(
5017     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5018     ),
5019     "uri" => ""
5020     ),
5021 joku 329 "sixy" => array(
5022     "icon" => "robot",
5023     "title" => "Sixy.ch",
5024     "rule" => array(
5025     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5026     ),
5027     "uri" => "http://sixy.ch"
5028     ),
5029 joku 63 "skaffe" => array(
5030     "icon" => "robot",
5031     "title" => "Skaffe",
5032     "rule" => array(
5033     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5034     ),
5035     "uri" => "http://www.skaffe.com"
5036     ),
5037     "skizzle" => array(
5038     "icon" => "skizzle",
5039     "title" => "Skizzle",
5040     "rule" => array(
5041     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5042     ),
5043     "uri" => "http://www.skizzle.com"
5044     ),
5045     "slider" => array(
5046     "icon" => "robot",
5047     "title" => "Slider",
5048     "rule" => array(
5049     "^Slider[ /]([0-9.]{1,10})" => "\\1"
5050     ),
5051     "uri" => ""
5052     ),
5053     "slugch" => array(
5054     "icon" => "robot",
5055 matthys 209 "title" => "Slugch",
5056 joku 63 "rule" => array(
5057     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5058     ),
5059     "uri" => ""
5060     ),
5061     "smartware" => array(
5062     "icon" => "robot",
5063     "title" => "SmartWareSoft",
5064     "rule" => array(
5065     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5066     ),
5067     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5068     ),
5069     "snookit" => array(
5070     "icon" => "snookit",
5071     "title" => "Snookit",
5072     "rule" => array(
5073     "^snookit" => ""
5074     ),
5075     "uri" => "http://www.snookit.com/"
5076     ),
5077     "snoopy" => array(
5078     "icon" => "robot",
5079     "title" => "Snoopy",
5080     "rule" => array(
5081     "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1", // [^0-9]* instead of greedy .+ : the old form left only the last version character in group 1
5082     "sna-([0-9.]{1,10})" => "\\1"
5083     ),
5084     "uri" => "http://snoopy.sourceforge.net/"
5085     ),
5086     "snyke" => array(
5087     "icon" => "robot",
5088     "title" => "Snyke",
5089     "rule" => array(
5090     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5091     ),
5092     "uri" => "http://www.snyke.com"
5093     ),
5094     "socialradar" => array(
5095     "icon" => "socialradar",
5096     "title" => "Social Radar",
5097     "rule" => array(
5098     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5099     ),
5100     "uri" => "http://infegy.com/"
5101     ),
5102     "soegning" => array(
5103     "icon" => "soegning",
5104 matthys 209 "title" => "Søgning",
5105 joku 63 "rule" => array(
5106     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5107     ),
5108     "uri" => ""
5109     ),
5110     "soft411" => array(
5111     "icon" => "soft411",
5112     "title" => "Soft411",
5113     "rule" => array(
5114     "SOFT411 Directory" => ""
5115     ),
5116     "uri" => ""
5117     ),
5118     "sogou" => array(
5119     "icon" => "sogou",
5120     "title" => "Sogou",
5121     "rule" => array(
5122     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5123     ),
5124     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5125     ),
5126     "sohu" => array(
5127     "icon" => "robot",
5128     "title" => "Sohu",
5129     "rule" => array(
5130     "sohu[ \-](agent|search)" => ""
5131     ),
5132     "uri" => ""
5133     ),
5134     "somewhere" => array(
5135     "icon" => "robot",
5136 matthys 209 "title" => "Somewhere.com",
5137 joku 63 "rule" => array(
5138     "Mozilla\@somewhere\.com" => "" // pattern has no capture group, so there is no \\1 to report
5139     ),
5140     "uri" => "http://www.somewhere.com/"
5141     ),
5142     "sopheus" => array(
5143     "icon" => "robot",
5144     "title" => "Sopheus",
5145     "rule" => array(
5146     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5147     ),
5148     "uri" => "http://www.thenetplanet.com"
5149     ),
5150     "soso" => array(
5151     "icon" => "soso",
5152     "title" => "Soso",
5153     "rule" => array(
5154     "^Soso(image)?spider" => ""
5155     ),
5156     "uri" => "http://help.soso.com/soso-image-spider.htm"
5157     ),
5158     "souppot" => array(
5159     "icon" => "robot",
5160     "title" => "SoupPot",
5161     "rule" => array(
5162     "SoupPotBot" => ""
5163     ),
5164     "uri" => ""
5165     ),
5166     "specificmedia" => array(
5167     "icon" => "specificmedia",
5168     "title" => "Specific Media",
5169     "rule" => array(
5170     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5171     ),
5172     "uri" => ""
5173     ),
5174     "sphider" => array(
5175     "icon" => "sphider",
5176     "title" => "Sphider",
5177     "rule" => array(
5178     "Sphider" => ""
5179     ),
5180     "uri" => "http://www.sphider.eu"
5181     ),
5182     "spinn3r" => array(
5183     "icon" => "robot",
5184     "title" => "Spinn3r",
5185     "rule" => array(
5186     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5187     ),
5188     "uri" => "http://spinn3r.com/robot"
5189     ),
5190     "sproose" => array(
5191     "icon" => "robot",
5192 matthys 209 "title" => "Sproose",
5193 joku 63 "rule" => array(
5194     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5195     ),
5196     "uri" => "http://www.sproose.com/bot.html"
5197     ),
5198     "spurlbot" => array(
5199     "icon" => "robot",
5200     "title" => "SpurlBot",
5201     "rule" => array(
5202     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5203     ),
5204     "uri" => ""
5205     ),
5206     "stardownloader" => array(
5207     "icon" => "stardownloader",
5208     "title" => "Star Downloader",
5209     "rule" => array(
5210     "^Star Downloader( Pro)?" => ""
5211     ),
5212     "uri" => ""
5213     ),
5214     "steeler" => array(
5215     "icon" => "robot",
5216     "title" => "Steeler",
5217     "rule" => array(
5218     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5219     ),
5220     "uri" => ""
5221     ),
5222     "strategicboard" => array(
5223     "icon" => "strategicboard",
5224     "title" => "Strategic Board",
5225     "rule" => array(
5226     "Strategic Board Bot" => ""
5227     ),
5228     "uri" => "http://www.strategicboard.com"
5229     ),
5230     "suchbaer" => array(
5231     "icon" => "robot",
5232 matthys 209 "title" => "Suchbaer.de",
5233 joku 63 "rule" => array(
5234     "^suchbaer\.de" => ""
5235     ),
5236     "uri" => "http://www.suchbaer.de/"
5237     ),
5238     "suchbot" => array(
5239     "icon" => "robot",
5240 matthys 209 "title" => "Suchbot",
5241 joku 63 "rule" => array(
5242     "^suchbot" => ""
5243     ),
5244     "uri" => ""
5245     ),
5246     "suchende" => array(
5247     "icon" => "suchende",
5248 matthys 209 "title" => "Suchen.de",
5249 joku 63 "rule" => array(
5250     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5251     "^gonzo/([0-9.]{1,10})" => "\\1"
5252     ),
5253     "uri" => "http://www.suchen.de/"
5254     ),
5255     "suchknecht" => array(
5256     "icon" => "robot",
5257     "title" => "Suchknecht",
5258     "rule" => array(
5259     "^Suchknecht.at-Robot" => ""
5260     ),
5261     "uri" => "http://www.suchknecht.at/"
5262     ),
5263     "suchpad" => array(
5264     "icon" => "robot",
5265 matthys 209 "title" => "Suchpad",
5266 joku 63 "rule" => array(
5267     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5268     ),
5269     "uri" => "http://www.suchpad.de"
5270     ),
5271     "sunrise" => array(
5272     "icon" => "sunrise",
5273     "title" => "Sunrise",
5274     "rule" => array(
5275     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5276     ),
5277     "uri" => ""
5278     ),
5279     "superbot" => array(
5280     "icon" => "superbot",
5281     "title" => "SuperBot",
5282     "rule" => array(
5283     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5284     ),
5285     "uri" => ""
5286     ),
5287     "surfcontrol" => array(
5288     "icon" => "robot",
5289     "title" => "SurfControl",
5290     "rule" => array(
5291     "SurfControl" => "",
5292     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5293     ),
5294     "uri" => ""
5295     ),
5296     "surfnet" => array(
5297     "icon" => "robot",
5298     "title" => "SURFnet",
5299     "rule" => array(
5300     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5301     ),
5302     "uri" => ""
5303     ),
5304     "surfsafely" => array(
5305     "icon" => "robot",
5306     "title" => "Surfsafely",
5307     "rule" => array(
5308     "Submission Spider at surfsafely.com" => ""
5309     ),
5310     "uri" => "http://www.surfsafely.com"
5311     ),
5312     "surphace" => array(
5313     "icon" => "spherescout",
5314     "title" => "Surphace",
5315     "rule" => array(
5316     "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; [^0-9]* (not greedy .+) so group 1 holds the whole version
5317     "Surphace.+v([0-9.]{1,10})" => "\\1"
5318     ),
5319     "uri" => "http://www.surphace.com"
5320     ),
5321     "surveybot" => array(
5322     "icon" => "surveybot",
5323     "title" => "Whois Survey",
5324     "rule" => array(
5325     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5326     ),
5327     "uri" => ""
5328     ),
5329     "swoogle" => array(
5330     "icon" => "robot",
5331     "title" => "Swoogle",
5332     "rule" => array(
5333     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5334     ),
5335     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5336     ),
5337     "swse" => array(
5338     "icon" => "robot",
5339     "title" => "SWSE",
5340     "rule" => array(
5341     "sw\.deri\.org" => ""
5342     ),
5343     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5344     ),
5345     "swish-e" => array(
5346     "icon" => "swish-e",
5347     "title" => "Swish-e",
5348     "rule" => array(
5349     "^swish-e" => ""
5350     ),
5351     "uri" => "http://swish-e.org/"
5352     ),
5353     "sygol" => array(
5354     "icon" => "sygol",
5355     "title" => "Sygol",
5356     "rule" => array(
5357     "www.sygol.(com|net)" => ""
5358     ),
5359     "uri" => "http://www.sygol.com"
5360     ),
5361     "syllabs" => array(
5362     "icon" => "syllabs",
5363     "title" => "Syllabs",
5364     "rule" => array(
5365     "Focal[-]([0-9.]{1,10})" => "\\1"
5366     ),
5367     "uri" => "http://www.syllabs.com/crawler.html"
5368     ),
5369     "synapse" => array(
5370     "icon" => "robot",
5371     "title" => "Synapse",
5372     "rule" => array(
5373     " Synapse\)" => ""
5374     ),
5375     "uri" => "http://ws.apache.org/synapse/"
5376     ),
5377     "sync2it" => array(
5378     "icon" => "robot",
5379 matthys 209 "title" => "Sync2it",
5380 joku 63 "rule" => array(
5381     "^\!Susie" => ""
5382     ),
5383     "uri" => "http://www.sync2it.com/bms/susie.php"
5384     ),
5385     "syncit" => array(
5386     "icon" => "robot",
5387 matthys 209 "title" => "Syncit",
5388 joku 63 "rule" => array(
5389     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5390     ),
5391     "uri" => "http://www.syncit.com/"
5392     ),
5393     "syndic8" => array(
5394     "icon" => "syndic8",
5395     "title" => "Syndic8",
5396     "rule" => array(
5397     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5398     ),
5399     "uri" => "http://www.syndic8.com/"
5400     ),
5401     "syndicatie" => array(
5402     "icon" => "robot",
5403     "title" => "Syndicatie.nl",
5404     "rule" => array(
5405     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5406     "Syndicatie\.nl robot;" => ""
5407     ),
5408     "uri" => ""
5409     ),
5410     "synomia" => array(
5411     "icon" => "robot",
5412     "title" => "Synomia",
5413     "rule" => array(
5414     "^SynoBot" => ""
5415     ),
5416     "uri" => ""
5417     ),
5418     "synoo" => array(
5419     "icon" => "robot",
5420     "title" => "SynooBot",
5421     "rule" => array(
5422     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5423     ),
5424     "uri" => ""
5425     ),
5426     "szukacz" => array(
5427     "icon" => "szukacz",
5428     "title" => "Szukacz",
5429     "rule" => array(
5430     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5431     ),
5432     "uri" => ""
5433     ),
5434     "tagoo" => array(
5435     "icon" => "tagoobot",
5436     "title" => "Tagoo",
5437     "rule" => array(
5438     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5439     ),
5440     "uri" => "http://www.tagoo.ru"
5441     ),
5442     "tagword" => array(
5443     "icon" => "tagword",
5444     "title" => "Tagword",
5445     "rule" => array(
5446     "^Tagword" => ""
5447     ),
5448     "uri" => "http://tagword.com/dmoz_survey.php"
5449     ),
5450     "trailfire" => array(
5451     "icon" => "trailfire",
5452     "title" => "Trailfire",
5453     "rule" => array(
5454     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5455     ),
5456     "uri" => "http://trailfire.com"
5457     ),
5458     "tamu" => array(
5459     "icon" => "tamu",
5460     "title" => "Tamu Crawler",
5461     "rule" => array(
5462     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5463     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5464     ),
5465     "uri" => "http://irl.cs.tamu.edu/crawler/"
5466     ),
5467     "taptubot" => array(
5468     "icon" => "taptubot",
5469     "title" => "Taptu",
5470     "rule" => array(
5471     "taptubot" => ""
5472     ),
5473     "uri" => "http://www.taptu.com/corp/taptubot"
5474     ),
5475     "targetseek" => array(
5476     "icon" => "robot",
5477     "title" => "TargetSeek",
5478     "rule" => array(
5479     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5480     ),
5481     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5482     ),
5483     "taw" => array(
5484     "icon" => "taw",
5485     "title" => "TAW",
5486     "rule" => array(
5487     "TAW[ /]([0-9.]{1,10})" => "\\1"
5488     ),
5489     "uri" => "http://www.tawdis.net"
5490     ),
5491     "tcd" => array(
5492     "icon" => "tcd",
5493     "title" => "Trinity College Dublin",
5494     "rule" => array(
5495     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5496     ),
5497     "uri" => "http://www.tcd.ie"
5498     ),
5499     "technorati" => array(
5500     "icon" => "technorati",
5501     "title" => "Technorati",
5502     "rule" => array(
5503     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5504     ),
5505     "uri" => ""
5506     ),
5507     "teleport" => array(
5508     "icon" => "teleport",
5509     "title" => "Teleport",
5510     "rule" => array(
5511     "Teleport[ \-]?Pro" => ""
5512     ),
5513     "uri" => ""
5514     ),
5515     "terrar" => array(
5516     "icon" => "robot",
5517     "title" => "Terrar",
5518     "rule" => array(
5519     "^Fresh Search :: Terrar" => ""
5520     ),
5521     "uri" => ""
5522     ),
5523     "theophrastus" => array(
5524     "icon" => "robot",
5525     "title" => "Theophrastus",
5526     "rule" => array(
5527     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5528     ),
5529     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5530     ),
5531     "thumbnailscz" => array(
5532     "icon" => "robot",
5533 matthys 209 "title" => "Thumbnails.cz",
5534 joku 63 "rule" => array(
5535     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5536     ),
5537     "uri" => ""
5538     ),
5539     "thumbshot" => array(
5540     "icon" => "robot",
5541 matthys 209 "title" => "Thumbshots",
5542 joku 63 "rule" => array(
5543     "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is the "Version: "/"v" prefix; the version number is group 2
5544     "^thumbshots-de" => ""
5545     ),
5546     "uri" => "http://www.thumbshots.de"
5547     ),
5548     "thunderstone" => array(
5549     "icon" => "thunderstone",
5550     "title" => "Thunderstone",
5551     "rule" => array(
5552     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5553     "search.thunderstone.com" => ""
5554     ),
5555     "uri" => "http://search.thunderstone.com/"
5556     ),
5557     "timbobot" => array(
5558     "icon" => "robot",
5559 matthys 209 "title" => "TimboBot",
5560 joku 63 "rule" => array(
5561     "timboBot" => ""
5562     ),
5563     "uri" => ""
5564     ),
5565     "topsy" => array(
5566     "icon" => "topsy",
5567     "title" => "Topsy",
5568     "rule" => array(
5569     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5570     ),
5571     "uri" => "http://labs.topsy.com/butterfly.html"
5572     ),
5573     "trayce" => array(
5574     "icon" => "robot",
5575 matthys 209 "title" => "Trayce",
5576 joku 63 "rule" => array(
5577     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5578     ),
5579     "uri" => ""
5580     ),
5581     "tricus" => array(
5582     "icon" => "robot",
5583     "title" => "Tricus",
5584     "rule" => array(
5585     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5586     ),
5587     "uri" => ""
5588     ),
5589     "topicblogs" => array(
5590     "icon" => "robot",
5591     "title" => "Topicblogs",
5592     "rule" => array(
5593     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5594     ),
5595     "uri" => ""
5596     ),
5597     "touche" => array(
5598     "icon" => "touche",
5599 matthys 209 "title" => "Touché",
5600 joku 63 "rule" => array(
5601     "^Touche" => ""
5602     ),
5603     "uri" => "http://touche.com.ve"
5604     ),
5605     "tuezilla" => array(
5606     "icon" => "robot",
5607 matthys 209 "title" => "TÜzilla", // repaired double-encoded U-umlaut in the title
5608 joku 63 "rule" => array(
5609     "tuezilla.de" => ""
5610     ),
5611     "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5612     ),
5613     "turnitin" => array(
5614     "icon" => "turnitin",
5615     "title" => "Turnitin",
5616     "rule" => array(
5617     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5618     ),
5619     "uri" => ""
5620     ),
5621     "tutorgig" => array(
5622     "icon" => "robot",
5623     "title" => "TutorGig",
5624     "rule" => array(
5625     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5626     ),
5627     "uri" => ""
5628     ),
5629     "twiceler" => array(
5630     "icon" => "cuill",
5631 matthys 209 "title" => "Cuill",
5632 joku 63 "rule" => array(
5633     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5634     "Twiceler" => ""
5635     ),
5636     "uri" => "http://www.cuill.com/twiceler/robot.html"
5637     ),
5638     "twingly" => array(
5639     "icon" => "twingly",
5640     "title" => "Twingly",
5641     "rule" => array(
5642     "Twingly Recon" => ""
5643     ),
5644     "uri" => "http://www.twingly.com/"
5645     ),
5646 matthys 320 "twitter" => array(
5647     "icon" => "twitter",
5648     "title" => "Twitter",
5649     "rule" => array(
5650     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5651     ),
5652     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5653     ),
5654 joku 63 "typepad" => array(
5655     "icon" => "typepad",
5656     "title" => "TypePad",
5657     "rule" => array(
5658     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5659     ),
5660     "uri" => ""
5661     ),
5662     "udmsearch" => array(
5663     "icon" => "robot",
5664     "title" => "UdmSearch",
5665     "rule" => array(
5666     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5667     ),
5668     "uri" => ""
5669     ),
5670     "ukwizz" => array(
5671     "icon" => "ukwizz",
5672     "title" => "UKWizz",
5673     "rule" => array(
5674     "^Mackster.*ukwizz" => ""
5675     ),
5676     "uri" => "http://www.ukwizz.com"
5677     ),
5678     "ultraseek" => array(
5679     "icon" => "robot",
5680     "title" => "Ultraseek",
5681     "rule" => array(
5682     "Ultraseek" => ""
5683     ),
5684     "uri" => ""
5685     ),
5686     "ultraspider" => array(
5687     "icon" => "robot",
5688     "title" => "UltraSpider",
5689     "rule" => array(
5690     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5691     ),
5692     "uri" => "http://www.search.ch"
5693     ),
5694     "umai" => array(
5695     "icon" => "robot",
5696 matthys 209 "title" => "Umai",
5697 joku 63 "rule" => array(
5698     "umai[/ ]([0-9.]{1,10})" => "\\1"
5699     ),
5700     "uri" => ""
5701     ),
5702     "unchaos" => array(
5703     "icon" => "robot",
5704     "title" => "Unchaos",
5705     "rule" => array(
5706     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5707     "unchaos" => ""
5708     ),
5709     "uri" => ""
5710     ),
5711     "unido" => array(
5712     "icon" => "robot",
5713 matthys 209 "title" => "UNIdo",
5714 joku 63 "rule" => array(
5715     "^unido-bot" => "" // pattern has no capture group, so there is no \\1 to report
5716     ),
5717     "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5718     ),
5719     "updated" => array(
5720     "icon" => "robot",
5721     "title" => "Updated",
5722     "rule" => array(
5723     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5724     ),
5725     "uri" => ""
5726     ),
5727     "uptimebot" => array(
5728     "icon" => "robot",
5729     "title" => "UptimeBot",
5730     "rule" => array(
5731     "^UptimeBot" => ""
5732     ),
5733     "uri" => "http://www.uptimebot.com/"
5734     ),
5735     "urifetch" => array(
5736     "icon" => "robot",
5737     "title" => "URI::Fetch",
5738     "rule" => array(
5739     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5740     ),
5741     "uri" => ""
5742     ),
5743     "urlbase" => array(
5744     "icon" => "robot",
5745     "title" => "URLBase",
5746     "rule" => array(
5747     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5748     ),
5749     "uri" => ""
5750     ),
5751     "urlblaze" => array(
5752     "icon" => "robot",
5753     "title" => "URLBlaze",
5754     "rule" => array(
5755     "^URLBlaze" => ""
5756     ),
5757     "uri" => ""
5758     ),
5759     "urlcontr" => array(
5760     "icon" => "robot",
5761     "title" => "MS URL Control",
5762     "rule" => array(
5763     "Microsoft URL[ \-]?Control" => ""
5764     ),
5765     "uri" => ""
5766     ),
5767     "urlgetfile" => array(
5768     "icon" => "robot",
5769     "title" => "URLGetFile",
5770     "rule" => array(
5771     "^URLGetFile" => ""
5772     ),
5773     "uri" => ""
5774     ),
5775     "urlscope" => array(
5776     "icon" => "robot",
5777     "title" => "UrlScope",
5778     "rule" => array(
5779     "UrlScope" => ""
5780     ),
5781     "uri" => ""
5782     ),
5783     "urltrends" => array(
5784     "icon" => "urltrends",
5785 matthys 209 "title" => "UrlTrends",
5786 joku 63 "rule" => array(
5787     "Snappy/([0-9.]{1,10})" => "\\1",
5788     ),
5789     "uri" => ""
5790     ),
5791     "usww" => array(
5792     "icon" => "usww",
5793 matthys 209 "title" => "USWW",
5794 joku 63 "rule" => array(
5795     "usww\.com" => "",
5796     "Mozilla/5\.0 URL-Spider" => ""
5797     ),
5798     "uri" => "http://www.usww.com/"
5799     ),
5800     "usyd" => array(
5801     "icon" => "robot",
5802     "title" => "USyd-NLP-Spider",
5803     "rule" => array(
5804     "^USyd-NLP-Spider" => ""
5805     ),
5806     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5807     ),
5808     "vagabondo" => array(
5809     "icon" => "wiseguys",
5810     "title" => "WiseGuys",
5811     "rule" => array(
5812     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5813     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5814     ),
5815     "uri" => ""
5816     ),
5817     "unicorn" => array(
5818     "icon" => "w3c",
5819     "title" => "W3C Unicorn",
5820     "rule" => array(
5821     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5822     ),
5823     "uri" => "http://validator.w3.org/unicorn/"
5824     ),
5825     "validator" => array(
5826     "icon" => "w3c",
5827     "title" => "W3C Validator",
5828     "rule" => array(
5829     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5830     ),
5831     "uri" => "http://validator.w3.org/"
5832     ),
5833     "validator.nu" => array(
5834     "icon" => "validatornu",
5835     "title" => "Validator.nu",
5836     "rule" => array(
5837     "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5838     "^Validator.nu/LV" => "" // fallback without a capture group: no version to reference
5839     ),
5840     "uri" => "http://validator.nu/"
5841     ),
5841     ),
5842     "verity" => array(
5843     "icon" => "robot",
5844     "title" => "Verity",
5845     "rule" => array(
5846     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5847     "^vspider" => ""
5848     ),
5849     "uri" => "http://www.verity.com/"
5850     ),
5851     "versionsproject" => array(
5852     "icon" => "robot",
5853     "title" => "Versions-project",
5854     "rule" => array(
5855     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5856     ),
5857     "uri" => "http://www.versions-project.org/"
5858     ),
5859     "verticalmatch" => array(
5860     "icon" => "robot",
5861     "title" => "VerticalMatch",
5862     "rule" => array(
5863     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5864     ),
5865     "uri" => "http://www.VerticalMatch.com/"
5866     ),
5867     "verzamelgids" => array(
5868     "icon" => "robot",
5869     "title" => "Verzamelgids",
5870     "rule" => array(
5871     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5872     ),
5873     "uri" => "http://www.verzamelgids.nl/"
5874     ),
5875     "vestris" => array(
5876     "icon" => "vestris",
5877     "title" => "Vestris",
5878     "rule" => array(
5879     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5880     ),
5881     "uri" => "http://alkaline.vestris.com/"
5882     ),
5883     "vindex" => array(
5884     "icon" => "vindex",
5885     "title" => "Vindex",
5886     "rule" => array(
5887     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5888     ),
5889     "uri" => ""
5890     ),
5891     "visvo" => array(
5892     "icon" => "robot",
5893     "title" => "Visvo",
5894     "rule" => array(
5895     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5896     ),
5897     "uri" => "http://www.visvo.com"
5898     ),
5899     "voila" => array(
5900     "icon" => "voila",
5901     "title" => "Voila",
5902     "rule" => array(
5903     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5904     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5905     ),
5906     "uri" => ""
5907     ),
5908     "vonna" => array(
5909     "icon" => "robot",
5910     "title" => "Vonna",
5911     "rule" => array(
5912     "Vonna.com b o t" => ""
5913     ),
5914     "uri" => ""
5915     ),
5916     "vortex" => array(
5917     "icon" => "robot",
5918     "title" => "Vortex",
5919     "rule" => array(
5920     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5921     ),
5922     "uri" => "http://marty.anstey.ca/robots/vortex/"
5923     ),
5924     "w3sitesearch" => array(
5925     "icon" => "w3sitesearch",
5926     "title" => "W3SiteSearch",
5927     "rule" => array(
5928     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5929     ),
5930     "uri" => "http://www.w3sitesearch.de"
5931     ),
5932     "wagger" => array(
5933     "icon" => "robot",
5934     "title" => "Wagger",
5935     "rule" => array(
5936     "^Waggr" => ""
5937     ),
5938     "uri" => "http://www.waggr.com/"
5939     ),
5940     "wanadoo" => array(
5941     "icon" => "robot",
5942     "title" => "Wanadoo",
5943     "rule" => array(
5944     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5945     ),
5946     "uri" => "http://www.wanadoo.fr/"
5947     ),
5948     "wapalizer" => array(
5949     "icon" => "robot",
5950     "title" => "Wapalizer",
5951     "rule" => array(
5952     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5953     ),
5954     "uri" => "http://www.wapdrive.com/"
5955     ),
5956     "watson" => array(
5957     "icon" => "addy",
5958     "title" => "Dr.Watson",
5959     "rule" => array(
5960     "Watson[ /]([0-9.]{1,10})" => "\\1",
5961     "watson\.addy\.com" => ""
5962     ),
5963     "uri" => ""
5964     ),
5965     "wavefire" => array(
5966     "icon" => "robot",
5967     "title" => "Wavefire",
5968     "rule" => array(
5969     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
5970     ),
5971     "uri" => ""
5972     ),
5973     "waypath" => array(
5974     "icon" => "waypath",
5975     "title" => "Waypath",
5976     "rule" => array(
5977     "Waypath[ \-]?Scout" => "",
5978     "Waypath (development )?crawler" => ""
5979     ),
5980     "uri" => ""
5981     ),
5982     "wauuu" => array(
5983     "icon" => "wauuu",
5984     "title" => "Wauuu",
5985     "rule" => array(
5986     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the version is the only (first) capture group
5987     ),
5988     "uri" => "http://www.wauuu.com"
5989     ),
5990     "wdg" => array(
5991     "icon" => "wdg",
5992     "title" => "WDG Validator",
5993     "rule" => array(
5994     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
5995     ),
5996     "uri" => "http://www.htmlhelp.com/tools/validator/"
5997     ),
5998     "webagogo" => array(
5999     "icon" => "webagogo",
6000     "title" => "Webagogo",
6001     "rule" => array(
6002     "^Webagogo" => ""
6003     ),
6004     "uri" => "http://www.webagogo.be/"
6005     ),
6006     "webalta" => array(
6007     "icon" => "webalta",
6008     "title" => "WebAlta",
6009     "rule" => array(
6010     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6011     ),
6012     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6013     ),
6014     "webdigity" => array(
6015     "icon" => "robot",
6016     "title" => "Webdigity Whois Service",
6017     "rule" => array(
6018     "^webdigity whois service" => ""
6019     ),
6020     "uri" => "http://www.webdigity.com/ws"
6021     ),
6022     "webelixir" => array(
6023     "icon" => "webelixir",
6024     "title" => "Webelixir",
6025     "rule" => array(
6026     "^webelixir" => ""
6027     ),
6028     "uri" => "http://www.webelixir.net/"
6029     ),
6030     "webbotru" => array(
6031     "icon" => "robot",
6032     "title" => "Webbot.ru",
6033     "rule" => array(
6034     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6035     ),
6036     "uri" => "http://www.webbot.ru/bot.html"
6037     ),
6038     "webcapture" => array(
6039     "icon" => "robot",
6040     "title" => "WebCapture",
6041     "rule" => array(
6042     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6043     ),
6044     "uri" => ""
6045     ),
6046     "webcollage" => array(
6047     "icon" => "robot",
6048     "title" => "Webcollage",
6049     "rule" => array(
6050     "webcollage" => ""
6051     ),
6052     "uri" => ""
6053     ),
6054     "webcopier" => array(
6055     "icon" => "webcopier",
6056     "title" => "WebCopier",
6057     "rule" => array(
6058     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6059     ),
6060     "uri" => ""
6061     ),
6062     "webcorp" => array(
6063     "icon" => "webcorp",
6064     "title" => "WebCorp",
6065     "rule" => array(
6066     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6067     ),
6068     "uri" => "http://www.webcorp.org.uk/"
6069     ),
6070     "webcrawl" => array(
6071     "icon" => "robot",
6072     "title" => "WebCrawl",
6073     "rule" => array(
6074     "webcrawl\.net" => ""
6075     ),
6076     "uri" => ""
6077     ),
6078     "webdownloader" => array(
6079     "icon" => "robot",
6080     "title" => "Web Downloader",
6081     "rule" => array(
6082     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6083     ),
6084     "uri" => ""
6085     ),
6086     "webfetch" => array(
6087     "icon" => "robot",
6088 matthys 209 "title" => "WebFetch",
6089 joku 63 "rule" => array(
6090     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6091     ),
6092     "uri" => ""
6093     ),
6094     "webfind" => array(
6095     "icon" => "robot",
6096 matthys 209 "title" => "WebFind",
6097 joku 63 "rule" => array(
6098     "^WebFindBot" => ""
6099     ),
6100     "uri" => "http://www.web-find.com"
6101     ),
6102     "webglimpse" => array(
6103     "icon" => "robot",
6104     "title" => "Webglimpse",
6105     "rule" => array(
6106     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6107     ),
6108     "uri" => "http://webglimpse.net"
6109     ),
6110     "webgobbler" => array(
6111     "icon" => "robot",
6112     "title" => "webGobbler",
6113     "rule" => array(
6114     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6115     ),
6116     "uri" => ""
6117     ),
6118     "webimages" => array(
6119     "icon" => "webimages",
6120     "title" => "WebImages",
6121     "rule" => array(
6122     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6123     ),
6124     "uri" => "http://herbert.groot.jebbink.nl/"
6125     ),
6126     "weblight" => array(
6127     "icon" => "robot",
6128     "title" => "WebLight",
6129     "rule" => array(
6130     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6131     ),
6132     "uri" => "http://www.illumit.com/Products/weblight/"
6133     ),
6134     "weblinks" => array(
6135     "icon" => "robot",
6136     "title" => "WebLink's",
6137     "rule" => array(
6138     "^Weblink.s checker" => ""
6139     ),
6140     "uri" => ""
6141     ),
6142     "webmeasurement" => array(
6143     "icon" => "robot",
6144     "title" => "Webmeasurement",
6145     "rule" => array(
6146     "^webmeasurement-bot" => ""
6147     ),
6148     "uri" => "http://rvs.informatik.uni-leipzig.de"
6149     ),
6150     "webminer" => array(
6151     "icon" => "robot",
6152     "title" => "WebMiner",
6153     "rule" => array(
6154     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6155     ),
6156     "uri" => ""
6157     ),
6158     "webmin" => array(
6159     "icon" => "webmin",
6160     "title" => "Webmin",
6161     "rule" => array(
6162     "^webmin" => ""
6163     ),
6164     "uri" => ""
6165     ),
6166     "webmon" => array(
6167     "icon" => "webmon",
6168     "title" => "Webmon",
6169     "rule" => array(
6170     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6171     ),
6172     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6173     ),
6174     "webox" => array(
6175     "icon" => "robot",
6176     "title" => "WeBoX", // display name, no leading whitespace
6177     "rule" => array(
6178     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6179     ),
6180     "uri" => ""
6181     ),
6182     "webpatrol" => array(
6183     "icon" => "webpatrol",
6184     "title" => "WebPatrol",
6185     "rule" => array(
6186     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6187     ),
6188     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6189     ),
6190     "webpix" => array(
6191     "icon" => "webpix",
6192     "title" => "WebPix",
6193     "rule" => array(
6194     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6195     ),
6196     "uri" => ""
6197     ),
6198     "webrace" => array(
6199     "icon" => "robot",
6200     "title" => "WebRACE",
6201     "rule" => array(
6202     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6203     ),
6204     "uri" => ""
6205     ),
6206     "webreaper" => array(
6207     "icon" => "webreaper",
6208     "title" => "WebReaper",
6209     "rule" => array(
6210     "^WebReaper " => ""
6211     ),
6212     "uri" => "http://www.webreaper.net/"
6213     ),
6214     "webresult" => array(
6215     "icon" => "robot",
6216     "title" => "Webresult",
6217     "rule" => array(
6218     "Der webresult\.de Robot" => ""
6219     ),
6220     "uri" => ""
6221     ),
6222     "webring" => array(
6223     "icon" => "robot",
6224     "title" => "Webring Checker",
6225     "rule" => array(
6226     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6227     ),
6228     "uri" => ""
6229     ),
6230     "webripper" => array(
6231     "icon" => "webripper",
6232     "title" => "WebRipper",
6233     "rule" => array(
6234     "^WebRipper" => ""
6235     ),
6236     "uri" => "http://calluna-software.com"
6237     ),
6238     "webscaled" => array(
6239     "icon" => "webscaled",
6240     "title" => "Webscaled",
6241     "rule" => array(
6242     "Swarm" => ""
6243     ),
6244     "uri" => "http://webscaled.com/"
6245     ),
6246     "websearchau" => array(
6247     "icon" => "websearchau",
6248     "title" => "WebSearch.COM.AU",
6249     "rule" => array(
6250     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6251     ),
6252     "uri" => "http://WebSearch.com.au/"
6253     ),
6254     "websearchbench" => array(
6255     "icon" => "robot",
6256     "title" => "WebSearchBench",
6257     "rule" => array(
6258     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6259     ),
6260     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6261     ),
6262     "websense" => array(
6263     "icon" => "websense",
6264     "title" => "Websense",
6265     "rule" => array(
6266     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6267     ),
6268     "uri" => ""
6269     ),
6270     "websiteshadow" => array(
6271     "icon" => "websiteshadow",
6272     "title" => "Websiteshadow",
6273     "rule" => array(
6274     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6275     ),
6276     "uri" => "http://websiteshadow.com"
6277     ),
6278     "websiteworth" => array(
6279     "icon" => "robot",
6280     "title" => "WebsiteWorth",
6281     "rule" => array(
6282     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6283     ),
6284     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6285     ),
6286     "websquash" => array(
6287     "icon" => "websquash",
6288     "title" => "Websquash",
6289     "rule" => array(
6290     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6291     ),
6292     "uri" => ""
6293     ),
6294     "webstripper" => array(
6295     "icon" => "robot",
6296     "title" => "WebStripper",
6297     "rule" => array(
6298     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6299     ),
6300     "uri" => ""
6301     ),
6302     "webzip" => array(
6303     "icon" => "webzip",
6304     "title" => "WebZIP",
6305     "rule" => array(
6306     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6307     ),
6308     "uri" => ""
6309     ),
6310     "wep" => array(
6311     "icon" => "robot",
6312     "title" => "WEP Search",
6313     "rule" => array(
6314     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6315     ),
6316     "uri" => ""
6317     ),
6318     "westwind" => array(
6319     "icon" => "robot",
6320     "title" => "West Wind Internet Protocols",
6321     "rule" => array(
6322     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6323     ),
6324     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6325     ),
6326     "wget" => array(
6327     "icon" => "wget",
6328     "title" => "Wget",
6329     "rule" => array(
6330 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6331     "Wget" => ""
6332 joku 63 ),
6333     "uri" => ""
6334     ),
6335     "whizbang" => array(
6336     "icon" => "whizbang",
6337     "title" => "WhizBang",
6338     "rule" => array(
6339     "WhizBang" => ""
6340     ),
6341     "uri" => "http://www.whizbang.com/crawler/"
6342     ),
6343     "whois" => array(
6344     "icon" => "whois",
6345     "title" => "Who.is",
6346     "rule" => array(
6347     "Who.is Bot" => ""
6348     ),
6349     "uri" => "http://www.who.is/"
6350     ),
6351     "wikiwix" => array(
6352     "icon" => "wikiwix",
6353     "title" => "Wikiwix",
6354     "rule" => array(
6355     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6356     ),
6357     "uri" => "http://www.wikiwix.com/"
6358     ),
6359     "wingflyer" => array(
6360     "icon" => "robot",
6361     "title" => "WingFlyer",
6362     "rule" => array(
6363     "^WebFetch" => ""
6364     ),
6365     "uri" => "http://www.wingflyer.com/"
6366     ),
6367     "wininet" => array(
6368     "icon" => "robot",
6369     "title" => "WinInet",
6370     "rule" => array(
6371     "TeamSoft WinInet Component" => ""
6372     ),
6373     "uri" => "http://www.winsoft.sk/wininet.htm"
6374     ),
6375     "winhttp" => array(
6376     "icon" => "robot",
6377     "title" => "WinHTTP",
6378     "rule" => array(
6379     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6380     ),
6381     "uri" => ""
6382     ),
6383     "wire" => array(
6384     "icon" => "robot",
6385     "title" => "WIRE",
6386     "rule" => array(
6387     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6388     ),
6389     "uri" => ""
6390     ),
6391     "wmp" => array(
6392     "icon" => "robot",
6393     "title" => "WMP",
6394     "rule" => array(
6395     "^WMP" => ""
6396     ),
6397     "uri" => ""
6398     ),
6399     "woozweb" => array(
6400     "icon" => "woozweb",
6401     "title" => "Woozweb",
6402     "rule" => array(
6403     "woozweb" => ""
6404     ),
6405     "uri" => "http://www.woozweb.com/"
6406     ),
6407     "wordchamp" => array(
6408     "icon" => "robot",
6409     "title" => "WordChamp",
6410     "rule" => array(
6411     "^WordChampBot" => ""
6412     ),
6413     "uri" => "http://www.wordchamp.com/"
6414     ),
6415     "wordpress" => array(
6416     "icon" => "wordpress",
6417     "title" => "WordPress",
6418     "rule" => array(
6419     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6420     ),
6421     "uri" => ""
6422     ),
6423     "worio" => array(
6424     "icon" => "worio",
6425     "title" => "Worio",
6426     "rule" => array(
6427     "woriobot" => ""
6428     ),
6429     "uri" => "http://worio.com/"
6430     ),
6431     "worldlight" => array(
6432     "icon" => "worldlight",
6433     "title" => "WorldLight",
6434     "rule" => array(
6435     "^WorldLight" => ""
6436     ),
6437     "uri" => ""
6438     ),
6439     "worqmada" => array(
6440     "icon" => "robot",
6441     "title" => "WorQmada",
6442     "rule" => array(
6443     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6444     ),
6445     "uri" => ""
6446     ),
6447     "wotbox" => array(
6448     "icon" => "wotbox",
6449     "title" => "Wotbox",
6450     "rule" => array(
6451     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6452     ),
6453     "uri" => ""
6454     ),
6455     "wp" => array(
6456     "icon" => "wp",
6457     "title" => "Wirtualna Polska",
6458     "rule" => array(
6459     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6460     ),
6461     "uri" => "http://wp.pl"
6462     ),
6463     "wsb" => array(
6464     "icon" => "robot",
6465     "title" => "WebSearchBench",
6466     "rule" => array(
6467     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6468     "WSB " => ""
6469     ),
6470     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6471     ),
6472     "wume" => array(
6473     "icon" => "robot",
6474     "title" => "WUME Lab's",
6475     "rule" => array(
6476     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6477     ),
6478     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6479     ),
6480     "wusage" => array(
6481     "icon" => "wusage",
6482     "title" => "Wusage",
6483     "rule" => array(
6484     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6485     ),
6486     "uri" => "http://www.boutell.com/wusage/"
6487     ),
6488     "wwgrapevine" => array(
6489     "icon" => "wwgrapevine",
6490     "title" => "WWgrapevine",
6491     "rule" => array(
6492     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6493     ),
6494     "uri" => ""
6495     ),
6496     "wws" => array(
6497     "icon" => "robot",
6498     "title" => "WWSBOT",
6499     "rule" => array(
6500     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6501     ),
6502     "uri" => "http://www.analyzer.nu"
6503     ),
6504     "www4mail" => array(
6505     "icon" => "robot",
6506 matthys 209 "title" => "WWW4mail",
6507 joku 63 "rule" => array(
6508     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6509     ),
6510     "uri" => "http://www.www4mail.org/"
6511     ),
6512     "wwwc" => array(
6513     "icon" => "wwwc",
6514     "title" => "WWWC",
6515     "rule" => array(
6516     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6517     ),
6518     "uri" => ""
6519     ),
6520     "wwwd" => array(
6521     "icon" => "robot",
6522     "title" => "WWWD",
6523     "rule" => array(
6524     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6525     ),
6526     "uri" => ""
6527     ),
6528     "wwweasel" => array(
6529     "icon" => "wwweasel",
6530     "title" => "WWWeasel",
6531     "rule" => array(
6532     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6533     ),
6534     "uri" => ""
6535     ),
6536     "wwwfi" => array(
6537     "icon" => "wwwfi",
6538     "title" => "www.fi",
6539     "rule" => array(
6540     "www\.fi crawler" => ""
6541     ),
6542     "uri" => "http://www.fi/"
6543     ),
6544     "wwwmechanize" => array(
6545     "icon" => "robot",
6546     "title" => "WWW-Mechanize",
6547     "rule" => array(
6548     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6549     ),
6550     "uri" => ""
6551     ),
6552     "wwwoffle" => array(
6553     "icon" => "robot",
6554     "title" => "WWWoffle",
6555     "rule" => array(
6556     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6557     ),
6558     "uri" => ""
6559     ),
6560     "wwwster" => array(
6561     "icon" => "robot",
6562     "title" => "WWWster",
6563     "rule" => array(
6564     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6565     ),
6566     "uri" => ""
6567     ),
6568     "wysigot" => array(
6569     "icon" => "wysigot",
6570     "title" => "Wysigot",
6571     "rule" => array(
6572     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6573     ),
6574     "uri" => ""
6575     ),
6576     "xaldon" => array(
6577     "icon" => "xaldon",
6578     "title" => "Xaldon",
6579     "rule" => array(
6580     "Xaldon WebSpider" => ""
6581     ),
6582     "uri" => "http://www.xaldon.de/"
6583     ),
6584     "xenu" => array(
6585     "icon" => "xenu",
6586     "title" => "Xenu Link Sleuth",
6587     "rule" => array(
6588     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6589     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional "&#039;s"; the version is group 2
6590     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6591     ),
6592     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6593     ),
6594     "xerka" => array(
6595     "icon" => "xerka",
6596     "title" => "Xerka",
6597     "rule" => array(
6598     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6599     ),
6600     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6601     ),
6602     "xirq" => array(
6603     "icon" => "robot",
6604     "title" => "XIRQ",
6605     "rule" => array(
6606     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6607     ),
6608     "uri" => "http://www.xirq.com"
6609     ),
6610     "xmlslurp" => array(
6611     "icon" => "robot",
6612     "title" => "XMLSlurp",
6613     "rule" => array(
6614     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6615     ),
6616     "uri" => ""
6617     ),
6618     "xml-sitemaps" => array(
6619     "icon" => "xml-sitemaps",
6620     "title" => "XML-Sitemaps",
6621     "rule" => array(
6622     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6623     ),
6624     "uri" => ""
6625     ),
6626     "xmlrpc" => array(
6627     "icon" => "robot",
6628     "title" => "Trackback",
6629     "rule" => array(
6630     "XMLRPC" => ""
6631     ),
6632     "uri" => ""
6633     ),
6634 matthys 294 "xovi" => array(
6635     "icon" => "xovi",
6636     "title" => "Xovi",
6637     "rule" => array(
6638     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6639     ),
6640     "uri" => "http://www.xovibot.net"
6641     ),
6642 joku 63 "yacy" => array(
6643     "icon" => "yacy",
6644     "title" => "Yacy",
6645     "rule" => array(
6646     "yacy\.net" => ""
6647     ),
6648     "uri" => ""
6649     ),
6650     "yahoo" => array(
6651     "icon" => "yahoo",
6652     "title" => "Yahoo",
6653     "rule" => array(
6654     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6655     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6656     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "", // generic fallback (also matches any "Yahoo-..."); listed after the versioned "Yahoo-..." rules so it cannot shadow them. NOTE(review): assumes the first matching rule wins - confirm against the matcher
6657     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6658     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6659     "Y!OASIS/TEST" => "",
6660     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6661     "Y!J; for robot study" => "",
6662     "Yahoo Japan; for robot study" => ""
6663     ),
6664     "uri" => "http://www.yahoo.com"
6665     ),
6666     "yahoo-feed" => array(
6667     "icon" => "yahoo",
6668     "title" => "Yahoo Feedseeker",
6669     "rule" => array(
6670     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6671     ),
6672     "uri" => "http://www.yahoo.com"
6673     ),
6674     "yandex" => array(
6675     "icon" => "yandex",
6676     "title" => "Yandex",
6677     "rule" => array(
6678     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6679     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6680     ),
6681     "uri" => "http://yandex.com/bots"
6682     ),
6683     "yanga" => array(
6684     "icon" => "yanga",
6685     "title" => "Yanga",
6686     "rule" => array (
6687     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6688     ),
6689     "uri" => "http://www.yanga.co.uk/"
6690     ),
6691     "yap" => array(
6692     "icon" => "yap",
6693     "title" => "Yap",
6694     "rule" => array(
6695     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6696     ),
6697     "uri" => "http://www.yapinc.com/"
6698     ),
6699     "yarienavoir" => array(
6700     "icon" => "robot",
6701     "title" => "Yarienavoir",
6702     "rule" => array(
6703     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6704     ),
6705     "uri" => "http://www.yarienavoir.net/"
6706     ),
6707     "yell" => array(
6708     "icon" => "yell",
6709     "title" => "Yell",
6710     "rule" => array(
6711     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6712     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6713     ),
6714     "uri" => ""
6715     ),
6716     "youdao" => array(
6717     "icon" => "youdao",
6718     "title" => "Youdao",
6719     "rule" => array(
6720     "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6721     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6722     ),
6723     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6724     ),
6725     "yoogli" => array(
6726     "icon" => "yoogli",
6727     "title" => "Yoogli",
6728     "rule" => array(
6729     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6730     ),
6731     "uri" => "http://www.yoogli.com"
6732     ),
6733     "yotta" => array(
6734     "icon" => "robot",
6735     "title" => "Yotta",
6736     "rule" => array(
6737     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6738     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6739     ),
6740     "uri" => "http://www.yottacars.com"
6741     ),
6742     "yoono" => array(
6743     "icon" => "yoono",
6744     "title" => "Yoono",
6745     "rule" => array(
6746     "Yoono" => ""
6747     ),
6748     "uri" => "http://www.yoono.com/"
6749     ),
6750     "yowedo" => array(
6751     "icon" => "robot",
6752     "title" => "Yowedo",
6753     "rule" => array(
6754     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6755     ),
6756     "uri" => "http://yowedo.com/en/partners.html"
6757     ),
6758     "yuntis" => array(
6759     "icon" => "robot",
6760 matthys 209 "title" => "Yuntis",
6761 joku 63 "rule" => array(
6762     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6763     ),
6764     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6765     ),
6766     "zao" => array(
6767     "icon" => "robot",
6768     "title" => "Zao",
6769     "rule" => array(
6770     "Zao[ /]([0-9.]{1,10})" => "\\1",
6771     "Zao-crawler" => ""
6772     ),
6773     "uri" => ""
6774     ),
6775     "zealbot" => array(
6776     "icon" => "zeal",
6777     "title" => "ZealBot",
6778     "rule" => array(
6779     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6780     ),
6781     "uri" => ""
6782     ),
6783     "zearchit" => array(
6784     "icon" => "zearchit",
6785     "title" => "Zearchit",
6786     "rule" => array(
6787     "Zearchit" => ""
6788     ),
6789     "uri" => "http://www.zearchit.de/"
6790     ),
6791     "zebz" => array(
6792     "icon" => "robot",
6793     "title" => "ze.bz",
6794     "rule" => array(
6795     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6796     ),
6797     "uri" => "http://www.ze.bz/"
6798     ),
6799     "zedzo" => array(
6800     "icon" => "robot",
6801     "title" => "Zedzo",
6802     "rule" => array(
6803     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6804     ),
6805     "uri" => "http://www.zedzo.com/"
6806     ),
6807     "zerx" => array(
6808     "icon" => "zerx",
6809     "title" => "Zerx",
6810     "rule" => array(
6811     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6812     ),
6813     "uri" => "http://www.zerx.com/"
6814     ),
6815     "zeus" => array(
6816     "icon" => "zeus",
6817     "title" => "Zeus",
6818     "rule" => array(
6819     "Zeus" => ""
6820     ),
6821     "uri" => "http://www.zeus.com"
6822     ),
6823     "zippp" => array(
6824     "icon" => "robot",
6825     "title" => "Zippp",
6826     "rule" => array(
6827     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6828     ),
6829     "uri" => ""
6830     ),
6831     "zippy" => array(
6832     "icon" => "robot",
6833     "title" => "Zippy",
6834     "rule" => array(
6835     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6836     ),
6837     "uri" => "http://www.zippyfinder.com"
6838     ),
6839     "zoeky" => array(
6840     "icon" => "robot",
6841     "title" => "Zoeky",
6842     "rule" => array(
6843     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6844     ),
6845     "uri" => ""
6846     ),
6847     "zoom" => array(
6848     "icon" => "zoom",
6849 matthys 209 "title" => "ZoomSpider",
6850 joku 63 "rule" => array(
6851     "^ZoomSpider" => ""
6852     ),
6853     "uri" => "http://www.wrensoft.com/"
6854     ),
6855     "zspider" => array(
6856     "icon" => "robot",
6857 matthys 209 "title" => "Zspider",
6858 joku 63 "rule" => array(
6859     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6860     ),
6861     "uri" => "http://feedback.redkolibri.com/"
6862     ),
6863 matthys 281 "zumbot" => array(
6864     "icon" => "robot",
6865     "title" => "ZUM Search",
6866     "rule" => array(
6867     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6868     ),
6869     "uri" => "http://help.zum.com/inquiry"
6870     ),
6871 joku 63 "zyborg" => array(
6872     "icon" => "zyborg",
6873     "title" => "WiseNutBot",
6874     "rule" => array(
6875     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6876     ),
6877     "uri" => ""
6878     ),
6879     // Catch up for the originals; they have to stay in that order.
6880     "blogbot" => array(
6881     "icon" => "blogbot",
6882     "title" => "BlogBot",
6883     "rule" => array(
6884     "Blog[ \-]?Bot" => ""
6885     ),
6886     "uri" => "http://www.blogbot.com/"
6887     ),
6888     "centrum" => array(
6889     "icon" => "centrum",
6890     "title" => "Centrum",
6891     "rule" => array(
6892     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6893     "^Centrum-checker" => ""
6894     ),
6895     "uri" => ""
6896     ),
6897     "httpclient" => array(
6898     "icon" => "robot",
6899     "title" => "HTTPClient",
6900     "rule" => array(
6901     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6902     "HTTP[ \-]?Client" => ""
6903     ),
6904     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6905     ),
6906     "incywincy" => array(
6907     "icon" => "robot",
6908     "title" => "IncyWincy",
6909     "rule" => array(
6910     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6911     "^IncyWincy" => ""
6912     ),
6913     "uri" => ""
6914     ),
6915     "java" => array(
6916     "icon" => "java",
6917     "title" => "Java",
6918     "rule" => array(
6919     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6920     ),
6921     "uri" => ""
6922     ),
6923     "libfetch" => array(
6924     "icon" => "robot",
6925     "title" => "Libfetch",
6926     "rule" => array(
6927     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6928     ),
6929     "uri" => "http://www.freebsd.org/"
6930     ),
6931     "libwww" => array(
6932     "icon" => "libwww",
6933 matthys 209 "title" => "LibWWW",
6934 joku 63 "rule" => array(
6935     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6936     "^libww(w|w-perl|w-FM)" => "",
6937     "MyApp.*libww(w|w-perl|w-FM)" => ""
6938     ),
6939     "uri" => ""
6940     ),
6941     "litefinder" => array(
6942     "icon" => "litefinder",
6943     "title" => "LiteFinder",
6944     "rule" => array(
6945     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6946     ),
6947     "uri" => "http://www.litefinder.net/about.html"
6948     ),
6949     "nutchorg" => array(
6950     "icon" => "nutchorg",
6951     "title" => "Nutch",
6952     "rule" => array(
6953     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6954     "Nutch" => ""
6955     ),
6956     "uri" => "http://lucene.apache.org/nutch/"
6957     ),
6958     "pythonurl" => array(
6959     "icon" => "pythonurl",
6960     "title" => "Python-url",
6961     "rule" => array(
6962     "Python[ \-]?urllib" => ""
6963     ),
6964     "uri" => ""
6965     ),
6966     // Known robots classified as SPAM bots
6967     "SPAM" => array(
6968     "icon" => "robot",
6969     "title" => "SPAM",
6970     "rule" => array(
6971     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
6972     "^PHOTO CHECK" => "",
6973     "^FOTOCHECKER" => "",
6974     "^IPTC CHECK" => "",
6975     "^DataCha0s" => "",
6976     "^Mac Finder" => "",
6977     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
6978     "^Missouri College Browse" => "",
6979     "Email[ \-]?Siphon" => "",
6980     "atSpider" => "",
6981     "autoemailspider" => "",
6982     "^Demo Bot" => "",
6983     "^Program Shareware" => "",
6984     "^Snapbot" => "",
6985     "^snap.com" => "",
6986     "^Guestbook Auto Submitter" => "",
6987     "panscient.com" => "",
6988     ),
6989     "uri" => ""
6990     ),
6991     // Things we don't know yet
6992     "robot" => array(
6993     "icon" => "robot",
6994     "title" => "Robot",
6995     "rule" => array(
6996     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
6997     )
6998     )
6999     );
7000 joku 261 ?>

Properties

Name Value
svn:keywords Id