ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 334
Committed: Sun Dec 14 14:28:13 2014 UTC (9 years, 11 months ago) by joku
File size: 156722 byte(s)
Log Message:
typo

File Contents

# Content
1 <?php
2 /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3 *
4 * SVN FILE $Id$
5 *
6 * Copyright (C) 2001-2015, the BBClone Team (see doc/authors.txt for details)
7 *
8 * This program is free software: you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation, either version 3 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * See doc/copying.txt for details
19 */
20
21 /////////////////////
22 // Robot Detection //
23 /////////////////////
24
25 $robot = array(
26 "1noon" => array(
27 "icon" => "1noon",
28 "title" => "1noon",
29 "rule" => array(
30 "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31 "^Yeti$" => ""
32 ),
33 "uri" => ""
34 ),
35 "123people" => array(
36 "icon" => "123people",
37 "title" => "123people",
38 "rule" => array(
39 "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40 ),
41 "uri" => "http://www.123people.fr/"
42 ),
43 "123spider" => array(
44 "icon" => "robot",
45 "title" => "123Spider",
46 "rule" => array(
47 "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48 ),
49 "uri" => "http://www.123spider.de/"
50 ),
51 "192com" => array(
52 "icon" => "robot",
53 "title" => "192.com",
54 "rule" => array(
55 "192\.comAgent" => "" // dot escaped so it only matches a literal "."
56 ),
57 "uri" => "http://www.192.com/"
58 ),
59 "200please" => array(
60 "icon" => "200please",
61 "title" => "200please Crawler",
62 "rule" => array(
63 "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64 ),
65 "uri" => "http://www.200please.com/bot"
66 ),
67 "2dehands" => array(
68 "icon" => "2dehands",
69 "title" => "2deHands",
70 "rule" => array(
71 "2dehands\.nl" => ""
72 ),
73 "uri" => ""
74 ),
75 "80legs" => array(
76 "icon" => "80legs",
77 "title" => "80legs",
78 "rule" => array(
79 "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80 ),
81 "uri" => "http://www.80legs.com/"
82 ),
83 "a1sitemap" => array(
84 "icon" => "a1sitemap",
85 "title" => "A1 Sitemap",
86 "rule" => array(
87 "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88 "miggibot[ /]([0-9.]{1,10})" => "\\1"
89 ),
90 "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91 ),
92 "a2b" => array(
93 "icon" => "a2b",
94 "title" => "A2B",
95 "rule" => array(
96 "www\.a2b\.cc" => ""
97 ),
98 "uri" => "http://www.a2b.cc"
99 ),
100 "abacho" => array(
101 "icon" => "robot",
102 "title" => "Abacho",
103 "rule" => array(
104 "^ABACHOBot" => ""
105 ),
106 "uri" => ""
107 ),
108 "abcdatos" => array(
109 "icon" => "abcdatos",
110 "title" => "ABCdatos",
111 "rule" => array(
112 "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113 ),
114 "uri" => "http://www.abcdatos.com/"
115 ),
116 "abot" => array(
117 "icon" => "abot",
118 "title" => "aBot",
119 "rule" => array(
120 "^abot[ /]([0-9.]{1,10})" => "\\1"
121 ),
122 "uri" => ""
123 ),
124 "about" => array(
125 "icon" => "about",
126 "title" => "About",
127 "rule" => array(
128 "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129 "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130 ),
131 "uri" => ""
132 ),
133 "aboutus" => array(
134 "icon" => "aboutus",
135 "title" => "AboutUs",
136 "rule" => array(
137 "AboutUsBot" => ""
138 ),
139 "uri" => "http://www.aboutus.org/"
140 ),
141 "ackerm" => array(
142 "icon" => "robot",
143 "title" => "Ackerm",
144 "rule" => array(
145 "www\.ackerm\.com" => "" // dots escaped so they only match a literal "."
146 ),
147 "uri" => "http://www.ackerm.com/"
148 ),
149 "acoi" => array(
150 "icon" => "acoi",
151 "title" => "AcoiRobot",
152 "rule" => array(
153 "^AcoiRobot" => ""
154 ),
155 "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156 ),
157 "acoon" => array(
158 "icon" => "acoon",
159 "title" => "Acoon",
160 "rule" => array(
161 "Acoon[ \-]?Robot" => ""
162 ),
163 "uri" => ""
164 ),
165 "accoona" => array(
166 "icon" => "accoona",
167 "title" => "Accoona",
168 "rule" => array(
169 "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170 "^accoona" => ""
171 ),
172 "uri" => ""
173 ),
174 "acme" => array(
175 "icon" => "acme",
176 "title" => "Acme",
177 "rule" => array(
178 "^Acme\.Spider" => ""
179 ),
180 "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181 ),
182 "active" => array(
183 "icon" => "robot",
184 "title" => "ActiveBookmark",
185 "rule" => array(
186 "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187 ),
188 "uri" => ""
189 ),
190 "admuncher" => array(
191 "icon" => "robot",
192 "title" => "Ad Muncher",
193 "rule" => array(
194 "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195 ),
196 "uri" => ""
197 ),
198 "aesop" => array(
199 "icon" => "robot",
200 "title" => "Aesop",
201 "rule" => array(
202 "^AESOP_com_SpiderMan" => ""
203 ),
204 "uri" => "http://www.aesop.com"
205 ),
206 "agada" => array(
207 "icon" => "robot",
208 "title" => "Agada",
209 "rule" => array(
210 "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211 ),
212 "uri" => ""
213 ),
214 "ahrefs" => array(
215 "icon" => "ahrefs",
216 "title" => "Ahrefs",
217 "rule" => array(
218 "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219 ),
220 "uri" => "http://ahrefs.com/"
221 ),
222 "aibot" => array(
223 "icon" => "robot",
224 "title" => "Aibot",
225 "rule" => array(
226 "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227 ),
228 "uri" => ""
229 ),
230 "aihitbot" => array(
231 "icon" => "robot",
232 "title" => "aiHit",
233 "rule" => array(
234 "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235 ),
236 "uri" => "http://www.aihit.com/"
237 ),
238 "aipbot" => array(
239 "icon" => "robot",
240 "title" => "Aipbot",
241 "rule" => array(
242 "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243 ),
244 "uri" => ""
245 ),
246 "aleksika" => array(
247 "icon" => "aleksika",
248 "title" => "Aleksika",
249 "rule" => array(
250 "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251 ),
252 "uri" => ""
253 ),
254 "alertsite" => array(
255 "icon" => "alertsite",
256 "title" => "AlertSite",
257 "rule" => array(
258 "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259 ),
260 "uri" => "http://www.alertsite.com/index.html"
261 ),
262 "alexa" => array(
263 "icon" => "alexa",
264 "title" => "Alexa",
265 "rule" => array(
266 "^ia_archive" => ""
267 ),
268 "uri" => "http://www.alexa.com/"
269 ),
270 "almaden" => array(
271 "icon" => "almaden",
272 "title" => "IBM Crawler",
273 "rule" => array(
274 "www\.almaden\.ibm\.com/cs/crawler" => ""
275 ),
276 "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277 ),
278 "altavista" => array(
279 "icon" => "altavista",
280 "title" => "Altavista",
281 "rule" => array(
282 "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283 "AltaVista V([0-9.]{1,10})" => "\\1",
284 "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285 ),
286 "uri" => "http://www.altavista.com/"
287 ),
288 "amazon" => array(
289 "icon" => "amazon",
290 "title" => "Amazon",
291 "rule" => array(
292 "^(aranhabot|amzn_assoc)" => "",
293 "^NutchEC2Test" => ""
294 ),
295 "uri" => "http://www.amazon.com/"
296 ),
297 "amidalla" => array(
298 "icon" => "amidalla",
299 "title" => "Amidalla",
300 "rule" => array(
301 "^amibot" => ""
302 ),
303 "uri" => ""
304 ),
305 "amfibi" => array(
306 "icon" => "amfibi",
307 "title" => "Amfibi",
308 "rule" => array(
309 "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310 "Amfibibot" => ""
311 ),
312 "uri" => ""
313 ),
314 "amphetadesk" => array(
315 "icon" => "robot",
316 "title" => "AmphetaDesk",
317 "rule" => array(
318 "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319 ),
320 "uri" => ""
321 ),
322 "amphetameme" => array(
323 "icon" => "robot",
324 "title" => "Amphetameme",
325 "rule" => array(
326 "amphetameme[ \-]?crawler" => ""
327 ),
328 "uri" => ""
329 ),
330 "annomille" => array(
331 "icon" => "robot",
332 "title" => "AnnoMille",
333 "rule" => array(
334 "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335 ),
336 "uri" => "http://www.annomille.it"
337 ),
338 "anonymouse" => array(
339 "icon" => "anonymouse",
340 "title" => "Anonymouse.org",
341 "rule" => array(
342 "http://Anonymouse\.org" => "" // dot escaped so it only matches a literal "."
343 ),
344 "uri" => "http://anonymouse.org"
345 ),
346 "ansearch" => array(
347 "icon" => "robot",
348 "title" => "Ansearch",
349 "rule" => array(
350 "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351 ),
352 "uri" => ""
353 ),
354 "answerchase" => array(
355 "icon" => "answerchase",
356 "title" => "AnswerChase",
357 "rule" => array(
358 "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359 ),
360 "uri" => "http://www.answerchase.com/"
361 ),
362 "antibot" => array(
363 "icon" => "robot",
364 "title" => "Antibot",
365 "rule" => array(
366 "antibot-V([0-9.]{1,10})" => "\\1"
367 ),
368 "uri" => ""
369 ),
370 "aonde" => array(
371 "icon" => "aonde",
372 "title" => "Aonde",
373 "rule" => array(
374 "^AONDE-Spider" => ""
375 ),
376 "uri" => ""
377 ),
378 "aonline" => array(
379 "icon" => "robot",
380 "title" => "A-Online.at",
381 "rule" => array(
382 "^A-Online Search" => ""
383 ),
384 "uri" => "http://www.a-online.at/"
385 ),
386 "aol" => array(
387 "icon" => "aol",
388 "title" => "AOLserver",
389 "rule" => array(
390 "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391 "^AOLserver" => ""
392 ),
393 "uri" => ""
394 ),
395 "apachebench" => array(
396 "icon" => "robot",
397 "title" => "ApacheBench",
398 "rule" => array(
399 "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400 ),
401 "uri" => ""
402 ),
403 "apassion4jazz" => array(
404 "icon" => "robot",
405 "title" => "Passion 4 Jazz",
406 "rule" => array(
407 "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408 ),
409 "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410 ),
411 "apexoo" => array(
412 "icon" => "robot",
413 "title" => "Apexoo",
414 "rule" => array(
415 "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416 ),
417 "uri" => "http://www.apexoo.com/"
418 ),
419 "apnoti" => array(
420 "icon" => "apnoti",
421 "title" => "Apnoti",
422 "rule" => array(
423 "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424 ),
425 "uri" => "http://www.apnoti.com/"
426 ),
427 "aport" => array(
428 "icon" => "aport",
429 "title" => "Aport",
430 "rule" => array(
431 "^Aport" => ""
432 ),
433 "uri" => ""
434 ),
435 "appie" => array(
436 "icon" => "walhello",
437 "title" => "Walhello",
438 "rule" => array(
439 "appie[ /]([0-9.]{1,10})" => "\\1"
440 ),
441 "uri" => ""
442 ),
443 "arachmo" => array(
444 "icon" => "arachmo",
445 "title" => "Arachmo",
446 "rule" => array(
447 "compatible; Arachmo" => ""
448 ),
449 "uri" => ""
450 ),
451 "arexera" => array(
452 "icon" => "arexera",
453 "title" => "Arexera",
454 "rule" => array(
455 "^X-Crawler" => "",
456 "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
457 ),
458 "uri" => "http://www.arexera.de/"
459 ),
460 "arianna" => array(
461 "icon" => "arianna",
462 "title" => "Arianna",
463 "rule" => array(
464 "^www\.arianna\.it" => "" // dots escaped so they only match a literal "."
465 ),
466 "uri" => "http://www.arianna.it/"
467 ),
468 "artface" => array(
469 "icon" => "robot",
470 "title" => "Artface",
471 "rule" => array(
472 "^ArtfaceBot" => ""
473 ),
474 "uri" => ""
475 ),
476 "artviper" => array(
477 "icon" => "artviper",
478 "title" => "artViper",
479 "rule" => array(
480 "artViper" => ""
481 ),
482 "uri" => "http://www.artviper.net/"
483 ),
484 "asinfo" => array(
485 "icon" => "robot",
486 "title" => "Any Search Info",
487 "rule" => array(
488 "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
489 ),
490 "uri" => "http://search-info.com/"
491 ),
492 "ask" => array(
493 "icon" => "askjeeves",
494 "title" => "Ask Jeeves",
495 "rule" => array(
496 "Ask[ \-]?Jeeves" => "",
497 "teomaagent" => ""
498 ),
499 "uri" => ""
500 ),
501 "askaboutoil" => array(
502 "icon" => "robot",
503 "title" => "AskAboutOil", // was "ASPseek", duplicated from the separate "aspseek" entry
504 "rule" => array(
505 "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
506 ),
507 "uri" => "http://askaboutoil.com/"
508 ),
509 "asked" => array(
510 "icon" => "robot",
511 "title" => "AskEd!",
512 "rule" => array(
513 "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
514 ),
515 "uri" => "http://asked.jp"
516 ),
517 "aspseek" => array(
518 "icon" => "robot",
519 "title" => "ASPseek",
520 "rule" => array(
521 "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
522 ),
523 "uri" => ""
524 ),
525 "atlocal" => array(
526 "icon" => "robot",
527 "title" => "At Local",
528 "rule" => array(
529 "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
530 ),
531 "uri" => "http://www.atlocal.com/"
532 ),
533 "atomz" => array(
534 "icon" => "atomz",
535 "title" => "Atomz",
536 "rule" => array(
537 "Atomz[/ ]([0-9.]{1,10})" => "\\1"
538 ),
539 "uri" => ""
540 ),
541 "axel" => array(
542 "icon" => "robot",
543 "title" => "Axel",
544 "rule" => array(
545 "^axel" => ""
546 ),
547 "uri" => ""
548 ),
549 "axmo" => array(
550 "icon" => "axmo",
551 "title" => "Axmo",
552 "rule" => array(
553 "AxmoRobot" => ""
554 ),
555 "uri" => ""
556 ),
557 "answerbus" => array(
558 "icon" => "answerbus",
559 "title" => "AnswerBus",
560 "rule" => array(
561 "answerbus" => ""
562 ),
563 "uri" => ""
564 ),
565 "automapit" => array(
566 "icon" => "robot",
567 "title" => "AutoMapIt",
568 "rule" => array(
569 "AutoMapIt[ /](Bot)?" => ""
570 ),
571 "uri" => "http://www.automapit.com/bot.html"
572 ),
573 "augurnfind" => array(
574 "icon" => "robot",
575 "title" => "Augurnfind",
576 "rule" => array(
577 "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
578 ),
579 "uri" => ""
580 ),
581 "awasu" => array(
582 "icon" => "awasu",
583 "title" => "Awasu",
584 "rule" => array(
585 "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
586 ),
587 "uri" => ""
588 ),
589 "axxus" => array(
590 "icon" => "axxus",
591 "title" => "axxus.de",
592 "rule" => array(
593 "whoiam" => ""
594 ),
595 "uri" => "http://www.axxus.de/"
596 ),
597 "ayell" => array(
598 "icon" => "ayell",
599 "title" => "Ayell",
600 "rule" => array(
601 "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
602 ),
603 "uri" => "http://eurobot.ayell.eu"
604 ),
605 "babaloo" => array(
606 "icon" => "babaloo",
607 "title" => "Babaloo",
608 "rule" => array(
609 "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
610 ),
611 "uri" => "http://www.babaloo.si"
612 ),
613 "babe" => array(
614 "icon" => "robot",
615 "title" => "ba.be",
616 "rule" => array(
617 "BACS http://www\.ba\.be" => "" // dots escaped so they only match a literal "."
618 ),
619 "uri" => "http://www.ba.be/"
620 ),
621 "baidu" => array(
622 "icon" => "baidu",
623 "title" => "Baidu",
624 "rule" => array(
625 "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
626 "Baiduspider" => ""
627 ),
628 "uri" => "http://www.baidu.com/search/spider.html"
629 ),
630 "bananatree" => array(
631 "icon" => "robot",
632 "title" => "BananaTree",
633 "rule" => array(
634 "www\.thebananatree\.org" => ""
635 ),
636 "uri" => "http://www.thebananatree.org/"
637 ),
638 "bdcindexer" => array(
639 "icon" => "robot",
640 "title" => "bdcindexer",
641 "rule" => array(
642 "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
643 ),
644 "uri" => "http://www.business.com/"
645 ),
646 "bdfetch" => array(
647 "icon" => "robot",
648 "title" => "BDFetch",
649 "rule" => array(
650 "^BDFetch" => ""
651 ),
652 "uri" => ""
653 ),
654 "bdncentral" => array(
655 "icon" => "robot",
656 "title" => "Bdncentral",
657 "rule" => array(
658 "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
659 ),
660 "uri" => "http://www.bdncentral.com/robot.html"
661 ),
662 "beammachine" => array(
663 "icon" => "robot",
664 "title" => "BeamMachine",
665 "rule" => array(
666 "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
667 ),
668 "uri" => "http://www.beammachine.net/"
669 ),
670 "become" => array(
671 "icon" => "become",
672 "title" => "Become",
673 "rule" => array(
674 "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
675 "(BecomeBot|Exabot)@exava\.com\)$" => ""
676 ),
677 "uri" => "http://www.become.com/"
678 ),
679 "beebware" => array(
680 "icon" => "robot",
681 "title" => "Beebware",
682 "rule" => array(
683 "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the version is the only capture group ("v?" is not a group)
684 ),
685 "uri" => ""
686 ),
687 "bigbrother" => array(
688 "icon" => "robot",
689 "title" => "Big Brother",
690 "rule" => array(
691 "^Big Brother" => ""
692 ),
693 "uri" => "http://pauillac.inria.fr/~fpottier/"
694 ),
695 "bigclique" => array(
696 "icon" => "robot",
697 "title" => "BigClique",
698 "rule" => array(
699 "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
700 ),
701 "uri" => "http://www.bigclique.com"
702 ),
703 "biglotron" => array(
704 "icon" => "robot",
705 "title" => "Biglotron",
706 "rule" => array(
707 "^BIGLOTRON" => ""
708 ),
709 "uri" => "http://www.bigclique.com"
710 ),
711 "bigsearch" => array(
712 "icon" => "bigsearch",
713 "title" => "Bigsearch",
714 "rule" => array(
715 "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped so it only matches a literal "."
716 ),
717 "uri" => ""
718 ),
719 "bilbo" => array(
720 "icon" => "robot",
721 "title" => "Bilbo",
722 "rule" => array(
723 "Bilbo[ /]([0-9.]{1,10})" => "\\1"
724 ),
725 "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
726 ),
727 "bilgi" => array(
728 "icon" => "bilgi",
729 "title" => "Bilgi",
730 "rule" => array(
731 "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version is group 2
732 ),
733 "uri" => "http://www.bilgi.com/"
734 ),
735 "bitacle" => array(
736 "icon" => "bitacle",
737 "title" => "Bitacle",
738 "rule" => array(
739 "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
740 ),
741 "uri" => "http://bitacle.org/"
742 ),
743 "bitbeamer" => array(
744 "icon" => "bitbeamer",
745 "title" => "BitBeamer",
746 "rule" => array(
747 "BitBeamer/([0-9.]{1,10})" => "\\1"
748 ),
749 "uri" => ""
750 ),
751 "biz360" => array(
752 "icon" => "biz360",
753 "title" => "Biz360",
754 "rule" => array(
755 "^Biz360 spider" => ""
756 ),
757 "uri" => ""
758 ),
759 "backlinktest" => array(
760 "icon" => "backlinktest",
761 "title" => "BacklinkCrawler",
762 "rule" => array(
763 "BacklinkCrawler" => ""
764 ),
765 "uri" => "http://www.backlinktest.com/crawler.html"
766 ),
767 "blaizbee" => array(
768 "icon" => "blaiz-bee",
769 "title" => "Blaiz-Bee",
770 "rule" => array(
771 "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // use the captured version instead of discarding it
772 ),
773 "uri" => ""
774 ),
775 "blogbeat" => array(
776 "icon" => "robot",
777 "title" => "BlogBeat",
778 "rule" => array(
779 "BlogBeat/?([0-9.]{1,10})" => "\\1",
780 ),
781 "uri" => "http://www.blogbeat.nl"
782 ),
783 "blogbotde" => array(
784 "icon" => "robot",
785 "title" => "blogbot.de",
786 "rule" => array(
787 "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
788 ),
789 "uri" => "http://blogbot.de/"
790 ),
791 "blogcensus" => array(
792 "icon" => "blogcensus",
793 "title" => "Blogcensus",
794 "rule" => array(
795 "^Blogcensus" => "",
796 ),
797 "uri" => "http://blogcensus.de/bot/"
798 ),
799 "blogdex" => array(
800 "icon" => "robot",
801 "title" => "Blogdex",
802 "rule" => array(
803 "Blogdex[ /]([0-9.]{1,10})" => "\\1",
804 ),
805 "uri" => ""
806 ),
807 "blogg" => array(
808 "icon" => "blogg",
809 "title" => "Blogg",
810 "rule" => array(
811 "^blogg\.de" => ""
812 ),
813 "uri" => ""
814 ),
815 "blogland" => array(
816 "icon" => "robot",
817 "title" => "BlogLand",
818 "rule" => array(
819 "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
820 ),
821 "uri" => ""
822 ),
823 "bloglines" => array(
824 "icon" => "bloglines",
825 "title" => "Bloglines",
826 "rule" => array(
827 "Bloglines[ /]([0-9.]{1,10})" => "\\1",
828 "Bloglines" => ""
829 ),
830 "uri" => ""
831 ),
832 "blogmap" => array(
833 "icon" => "robot",
834 "title" => "Blogmap",
835 "rule" => array(
836 "blogmap" => ""
837 ),
838 "uri" => ""
839 ),
840 "blogosphere" => array(
841 "icon" => "robot",
842 "title" => "Blogosphere",
843 "rule" => array(
844 "Blogosphere" => ""
845 ),
846 "uri" => ""
847 ),
848 "blogpeople" => array(
849 "icon" => "robot",
850 "title" => "BlogPeople",
851 "rule" => array(
852 "BlogPeople" => ""
853 ),
854 "uri" => ""
855 ),
856 "blogpulse" => array(
857 "icon" => "blogpulse",
858 "title" => "Blogpulse",
859 "rule" => array(
860 "Blogpulse" => ""
861 ),
862 "uri" => ""
863 ),
864 "blogranking" => array(
865 "icon" => "blogranking",
866 "title" => "BlogRanking",
867 "rule" => array(
868 "^BlogRanking(/RSS checker)?" => ""
869 ),
870 "uri" => ""
871 ),
872 "blogs" => array(
873 "icon" => "blogs",
874 "title" => "Blo.gs",
875 "rule" => array(
876 "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
877 "blo\.gs" => ""
878 ),
879 "uri" => ""
880 ),
881 "blogshares" => array(
882 "icon" => "blogshares",
883 "title" => "BlogShares",
884 "rule" => array(
885 "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
886 "(^| |\()Blogshares(\.com| |\))" => ""
887 ),
888 "uri" => ""
889 ),
890 "blogslife" => array(
891 "icon" => "robot",
892 "title" => "BlogsLife",
893 "rule" => array(
894 "Blogslive" => ""
895 ),
896 "uri" => ""
897 ),
898 "blogsnow" => array(
899 "icon" => "blogsnow",
900 "title" => "BlogsNow",
901 "rule" => array(
902 "blogsnowbot" => "",
903 "BlogsNow" => ""
904 ),
905 "uri" => ""
906 ),
907 "blogstreet" => array(
908 "icon" => "blogstreet",
909 "title" => "BlogStreet",
910 "rule" => array(
911 "^BlogStreetBot" => ""
912 ),
913 "uri" => ""
914 ),
915 "blogsurf" => array(
916 "icon" => "robot",
917 "title" => "BlogSurf",
918 "rule" => array(
919 "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
920 ),
921 "uri" => ""
922 ),
923 "blogtick" => array(
924 "icon" => "robot",
925 "title" => "BlogTick",
926 "rule" => array(
927 "BlogTickServer" => ""
928 ),
929 "uri" => ""
930 ),
931 "blogwatcher" => array(
932 "icon" => "blogwatcher",
933 "title" => "Blogwatcher",
934 "rule" => array(
935 "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
936 ),
937 "uri" => ""
938 ),
939 "blogwise" => array(
940 "icon" => "blogwise",
941 "title" => "Blogwise",
942 "rule" => array(
943 "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
944 ),
945 "uri" => ""
946 ),
947 "boardreader" => array(
948 "icon" => "boardreader",
949 "title" => "BoardReader",
950 "rule" => array(
951 "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
952 ),
953 "uri" => "http://www.boardreader.com"
954 ),
955 "bobby" => array(
956 "icon" => "bobby",
957 "title" => "Bobby",
958 "rule" => array(
959 "bobby[ /]([0-9.]{1,10})" => "\\1"
960 ),
961 "uri" => ""
962 ),
963 "boitho" => array(
964 "icon" => "robot",
965 "title" => "Boitho",
966 "rule" => array(
967 "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
968 ),
969 "uri" => ""
970 ),
971 "booch" => array(
972 "icon" => "robot",
973 "title" => "Booch",
974 "rule" => array(
975 "^booch[_ /]([0-9.]{1,10})" => "\\1"
976 ),
977 "uri" => ""
978 ),
979 "book" => array(
980 "icon" => "book",
981 "title" => "Bookmark",
982 "rule" => array(
983 "http://www\.bookmark\.ne\.jp" => ""
984 ),
985 "uri" => ""
986 ),
987 "bookdog" => array(
988 "icon" => "bookdog",
989 "title" => "Bookdog",
990 "rule" => array(
991 "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
992 ),
993 "uri" => ""
994 ),
995 "bordermanager" => array(
996 "icon" => "bordermanager",
997 "title" => "Border Manager",
998 "rule" => array(
999 "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1000 ),
1001 "uri" => ""
1002 ),
1003 "botonparade" => array(
1004 "icon" => "botonparade",
1005 "title" => "Bot on Parade",
1006 "rule" => array(
1007 "BotOnParade" => ""
1008 ),
1009 "uri" => "http://www.bots-on-para.de/bot.html"
1010 ),
1011 "botje" => array(
1012 "icon" => "botje",
1013 "title" => "Botje",
1014 "rule" => array(
1015 "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1016 ),
1017 "uri" => "http://www.botje.com/"
1018 ),
1019 "bottomfeeder" => array(
1020 "icon" => "bottomfeeder",
1021 "title" => "BottomFeeder",
1022 "rule" => array(
1023 "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1024 ),
1025 "uri" => ""
1026 ),
1027 "browseremulator" => array(
1028 "icon" => "browseremulator",
1029 "title" => "BrowserEmulator",
1030 "rule" => array(
1031 "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1032 ),
1033 "uri" => "http://www.dejavu.org/emulator.htm"
1034 ),
1035 "browsershots" => array(
1036 "icon" => "browsershots",
1037 "title" => "Browsershots",
1038 "rule" => array(
1039 "Browsershots URL Check" => ""
1040 ),
1041 "uri" => "http://browsershots.org"
1042 ),
1043 "browserspy" => array(
1044 "icon" => "robot",
1045 "title" => "BrowserSpy",
1046 "rule" => array(
1047 "BrowserSpy" => ""
1048 ),
1049 "uri" => ""
1050 ),
1051 "bruinbot" => array(
1052 "icon" => "robot",
1053 "title" => "BruinBot",
1054 "rule" => array(
1055 "BruinBot" => ""
1056 ),
1057 "uri" => ""
1058 ),
1059 "bruno" => array(
1060 "icon" => "robot",
1061 "title" => "Bruno",
1062 "rule" => array(
1063 "^Bruno" => ""
1064 ),
1065 "uri" => ""
1066 ),
1067 "btbot" => array(
1068 "icon" => "btbot",
1069 "title" => "BitTorrent",
1070 "rule" => array(
1071 "BTbot/([0-9.]{1,10})" => "\\1"
1072 ),
1073 "uri" => ""
1074 ),
1075 "builtwith" => array(
1076 "icon" => "builtwith",
1077 "title" => "BuiltWith",
1078 "rule" => array(
1079 "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1080 ),
1081 "uri" => "http://builtwith.com/bot.html"
1082 ),
1083 "bulkfeeds" => array(
1084 "icon" => "robot",
1085 "title" => "Bulkfeeds",
1086 "rule" => array(
1087 "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1088 ),
1089 "uri" => ""
1090 ),
1091 "burf" => array(
1092 "icon" => "burf",
1093 "title" => "Burf.com",
1094 "rule" => array(
1095 "^Norbert the Spider" => ""
1096 ),
1097 "uri" => "http://www.burf.com/"
1098 ),
1099 "butch" => array(
1100 "icon" => "robot",
1101 "title" => "Butch",
1102 "rule" => array(
1103 "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1104 ),
1105 "uri" => ""
1106 ),
1107 "buzzlogic" => array(
1108 "icon" => "buzzlogic",
1109 "title" => "Buzzlogic",
1110 "rule" => array(
1111 "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1112 ),
1113 "uri" => "http://www.buzzlogic.com"
1114 ),
1115 "catchbot" => array(
1116 "icon" => "catchbot",
1117 "title" => "CatchBot",
1118 "rule" => array(
1119 "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1120 ),
1121 "uri" => "http://www.catchbot.com"
1122 ),
1123 "camdiscover" => array(
1124 "icon" => "robot",
1125 "title" => "Camdiscover",
1126 "rule" => array(
1127 "^Camcrawler" => ""
1128 ),
1129 "uri" => ""
1130 ),
1131 "cazoodle" => array(
1132 "icon" => "cazoodle",
1133 "title" => "Cazoodle",
1134 "rule" => array(
1135 "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1136 "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1137 ),
1138 "uri" => "http://www.cazoodle.com/cazoodlebot"
1139 ),
1140 "ccbot" => array(
1141 "icon" => "robot",
1142 "title" => "ccBot",
1143 "rule" => array(
1144 "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1145 ),
1146 "uri" => "http://www.commoncrawl.org/bot.html"
1147 ),
1148 "ccgcrawl" => array(
1149 "icon" => "robot",
1150 "title" => "CCGCrawl",
1151 "rule" => array(
1152 "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1153 ),
1154 "uri" => "http://www.myworkbase.com/bot.html"
1155 ),
1156 "cerberian" => array(
1157 "icon" => "robot",
1158 "title" => "Cerberian Drtrs",
1159 "rule" => array(
1160 "^Cerberian Drtrs" => ""
1161 ),
1162 "uri" => ""
1163 ),
1164 "cfnetwork" => array(
1165 "icon" => "robot",
1166 "title" => "CFNetwork", // was "Cerberian Drtrs", duplicated from the preceding "cerberian" entry
1167 "rule" => array(
1168 "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1169 ),
1170 "uri" => "http://www.cfnetwork.be/"
1171 ),
1172 "charlotte" => array(
1173 "icon" => "charlotte",
1174 "title" => "Charlotte",
1175 "rule" => array(
1176 "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1177 ),
1178 "uri" => ""
1179 ),
1180 "cirilizator" => array(
1181 "icon" => "cirilizator",
1182 "title" => "Cirilizator",
1183 "rule" => array(
1184 "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1185 ),
1186 "uri" => ""
1187 ),
1188 "claria" => array(
1189 "icon" => "robot",
1190 "title" => "Claria",
1191 "rule" => array(
1192 "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1193 "(Claria|Diamond)(Bot)" => ""
1194 ),
1195 "uri" => ""
1196 ),
1197 "claymont" => array(
1198 "icon" => "claymont",
1199 "title" => "Claymont",
1200 "rule" => array(
1201 "claymont\.com" => "",
1202 "OliverPerry" => ""
1203 ),
1204 "uri" => "http://www.claymont.com"
1205 ),
1206 "clush" => array(
1207 "icon" => "clush",
1208 "title" => "Clush",
1209 "rule" => array(
1210 "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1211 ),
1212 "uri" => ""
1213 ),
1214 "cmsworldmap" => array(
1215 "icon" => "cmsworldmap",
1216 "title" => "CMS World Map",
1217 "rule" => array(
1218 "cmsworldmap" => ""
1219 ),
1220 "uri" => "http://www.cmsworldmap.com/"
1221 ),
1222 "cobion" => array(
1223 "icon" => "robot",
1224 "title" => "Cobion",
1225 "rule" => array(
1226 " (QXW03018|obot)\)" => ""
1227 ),
1228 "uri" => ""
1229 ),
1230 "coccoc" => array(
1231 "icon" => "coccoc",
1232 "title" => "Coccoc",
1233 "rule" => array(
1234 "coccoc[ /]([0-9.]{1,10})" => "\\1"
1235 ),
1236 "uri" => "http://help.coccoc.com"
1237 ),
1238 "coldfusion" => array(
1239 "icon" => "coldfusion",
1240 "title" => "ColdFusion",
1241 "rule" => array(
1242 "^coldfusion" => ""
1243 ),
1244 "uri" => ""
1245 ),
1246 "combine" => array(
1247 "icon" => "robot",
1248 "title" => "Combine",
1249 "rule" => array(
1250 "Combine[ /]([0-9.]{1,10})" => "\\1"
1251 ),
1252 "uri" => ""
1253 ),
1254 "combot" => array(
1255 "icon" => "robot",
1256 "title" => "comBot",
1257 "rule" => array(
1258 "^comBot[ /]([0-9.]{1,10})" => "\\1"
1259 ),
1260 "uri" => ""
1261 ),
1262 "comet" => array(
1263 "icon" => "comet",
1264 "title" => "Comet",
1265 "rule" => array(
1266 "cometsearch@cometsystems" => ""
1267 ),
1268 "uri" => ""
1269 ),
1270 "commerobo" => array(
1271 "icon" => "robot",
1272 "title" => "Commerobo",
1273 "rule" => array(
1274 "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1275 ),
1276 "uri" => ""
1277 ),
1278 "comrite" => array(
1279 "icon" => "robot",
1280 "title" => "ComRite",
1281 "rule" => array(
1282 "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1283 ),
1284 "uri" => "http://www.comrite.com/"
1285 ),
1286 "convera" => array(
1287 "icon" => "convera",
1288 "title" => "Convera",
1289 "rule" => array(
1290 "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1291 "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1292 ),
1293 "uri" => ""
1294 ),
1295 "coolbot" => array(
1296 "icon" => "robot",
1297 "title" => "CoolBot",
1298 "rule" => array(
1299 "^CoolBot" => ""
1300 ),
1301 "uri" => ""
1302 ),
1303 "cosmix" => array(
1304 "icon" => "robot",
1305 "title" => "Cosmix",
1306 "rule" => array(
1307 "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1308 ),
1309 "uri" => ""
1310 ),
1311 "cosmos" => array(
1312 "icon" => "robot",
1313 "title" => "Cosmos",
1314 "rule" => array(
1315 "^cosmos" => ""
1316 ),
1317 "uri" => ""
1318 ),
1319 "cosmoty" => array(
1320 "icon" => "robot",
1321 "title" => "Cosmoty",
1322 "rule" => array(
1323 "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1324 ),
1325 "uri" => "http://www.uchoose.de/crawler/beautybot/"
1326 ),
1327 "covario" => array(
1328 "icon" => "covario",
1329 "title" => "Covario",
1330 "rule" => array(
1331 "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1332 ),
1333 "uri" => "http://www.covario.com/ids/"
1334 ),
1335 "creativecommons" => array(
1336 "icon" => "creativecommons",
1337 "title" => "Creative Commons",
1338 "rule" => array(
1339 "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1340 ),
1341 "uri" => ""
1342 ),
1343 "cscrawler" => array(
1344 "icon" => "robot",
1345 "title" => "CsCrawler",
1346 "rule" => array(
1347 "CsCrawler" => ""
1348 ),
1349 "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1350 ),
1351 "jigsaw" => array(
1352 "icon" => "jigsaw",
1353 "title" => "Jigsaw",
1354 "rule" => array(
1355 "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1356 ),
1357 "uri" => "http://jigsaw.w3.org/css-validator/"
1358 ),
1359 "csscheck" => array(
1360 "icon" => "w3c",
1361 "title" => "W3C CSS Validator",
1362 "rule" => array(
1363 "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1364 ),
1365 "uri" => "http://jigsaw.w3.org/css-validator/"
1366 ),
1367 "custo" => array(
1368 "icon" => "robot",
1369 "title" => "Custo",
1370 "rule" => array(
1371 "Custo[ /]([0-9.]{1,10})" => "\\1"
1372 ),
1373 "uri" => ""
1374 ),
1375 "cybernavi" => array(
1376 "icon" => "robot",
1377 "title" => "CyberNavi",
1378 "rule" => array(
1379 "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1380 ),
1381 "uri" => ""
1382 ),
1383 "cyberpatrol" => array(
1384 "icon" => "cyberpatrol",
1385 "title" => "CyberPatrol",
1386 "rule" => array(
1387 "^CyberPatrol" => ""
1388 ),
1389 "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1390 ),
1391 "cyberz" => array(
1392 "icon" => "cyberz",
1393 "title" => "Cyberz",
1394 "rule" => array(
1395 "Cyberz Communication Agent" => ""
1396 ),
1397 "uri" => ""
1398 ),
1399 "cydral" => array(
1400 "icon" => "robot",
1401 "title" => "Cydral",
1402 "rule" => array(
1403 "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1404 ),
1405 "uri" => ""
1406 ),
1407 "cynthia" => array(
1408 "icon" => "cynthia",
1409 "title" => "Cynthia Says",
1410 "rule" => array(
1411 "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1412 ),
1413 "uri" => ""
1414 ),
1415 "d4x" => array(
1416 "icon" => "d4x",
1417 "title" => "Downloader for X",
1418 "rule" => array(
1419 "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1420 ),
1421 "uri" => ""
1422 ),
1423 "da" => array(
1424 "icon" => "da",
1425 "title" => "DA",
1426 "rule" => array(
1427 "^DA[ /]([0-9.]{1,10})" => "\\1"
1428 ),
1429 "uri" => ""
1430 ),
1431 "daum" => array(
1432 "icon" => "daum",
1433 "title" => "DAUM",
1434 "rule" => array(
1435 "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1436 "DAUM Web Robot" => "",
1437 "Daum Communications Corp" => "",
1438 "EDI[ /]([0-9.]{1,10})" => "\\1",
1439 "Edacious.*Intelligent Web Robot" => "",
1440 "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1441 ),
1442 "uri" => "http://ws.daum.net/"
1443 ),
1444 "daypop" => array(
1445 "icon" => "robot",
1446 "title" => "Daypop",
1447 "rule" => array(
1448 "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1449 ),
1450 "uri" => ""
1451 ),
1452 "delfi" => array(
1453 "icon" => "delfi",
1454 "title" => "Delfi",
1455 "rule" => array(
1456 "crawl at delfi dot lt" => ""
1457 ),
1458 "uri" => ""
1459 ),
1460 "depspid" => array(
1461 "icon" => "depspid",
1462 "title" => "DepSpid",
1463 "rule" => array(
1464 "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1465 ),
1466 "uri" => ""
1467 ),
1468 "devonagent" => array(
1469 "icon" => "devonagent",
1470 "title" => "DEVONagent",
1471 "rule" => array(
1472 "DEVONtech" => ""
1473 ),
1474 "uri" => ""
1475 ),
1476 "diffbot" => array(
1477 "icon" => "diffbot",
1478 "title" => "Diffbot",
1479 "rule" => array(
1480 " Diffbot" => ""
1481 ),
1482 "uri" => "http://www.diffbot.com"
1483 ),
1484 "diribot" => array(
1485 "icon" => "diribot",
1486 "title" => "Diri",
1487 "rule" => array(
1488 "diribot" => ""
1489 ),
1490 "uri" => "http://www.diri.bg"
1491 ),
1492 "directhit" => array(
1493 "icon" => "robot",
1494 "title" => "Direct Hit",
1495 "rule" => array(
1496 "EZResult -- Internet Search Engine" => ""
1497 ),
1498 "uri" => "http://www.directhit.com"
1499 ),
1500 "disco" => array(
1501 "icon" => "disco",
1502 "title" => "Disco",
1503 "rule" => array(
1504 "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1505 "discobot[/ -]([0-9.]{1,10})" => "\\1",
1506 "disco-crawl@discoveryengine.com" => ""
1507 ),
1508 "uri" => "http://www.discoveryengine.com/"
1509 ),
1510 "discopump" => array(
1511 "icon" => "robot",
1512 "title" => "DISCo Pump",
1513 "rule" => array(
1514 "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1515 ),
1516 "uri" => ""
1517 ),
1518 "dkimreputation" => array(
1519 "icon" => "dkimreputation",
1520 "title" => "DKIM Reputation",
1521 "rule" => array(
1522 "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1523 ),
1524 "uri" => "http://www.dkim-reputation.org"
1525 ),
1526 "dnsdigger" => array(
1527 "icon" => "dnsdigger",
1528 "title" => "DNS-Digger",
1529 "rule" => array(
1530 "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1531 ),
1532 "uri" => "http://www.dnsdigger.com"
1533 ),
1534 "dnsvalidation" => array(
1535 "icon" => "dnsvalidation",
1536 "title" => "DNS Validation",
1537 "rule" => array(
1538 "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1539 ),
1540 "uri" => "http://www.dnsvalidation.com/"
1541 ),
1542 "doctorhtml" => array(
1543 "icon" => "robot",
1544 "title" => "DoctorHTML",
1545 "rule" => array(
1546 "Doctor[ \-]?HTML" => ""
1547 ),
1548 "uri" => ""
1549 ),
1550 "dolphin" => array(
1551 "icon" => "dolphin",
1552 "title" => "Dolphin",
1553 "rule" => array(
1554 "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1555 ),
1556 "uri" => "http://telehouse.ru/crawler.html"
1557 ),
1558 "domaindatei" => array(
1559 "icon" => "robot",
1560 "title" => "Domaindatei",
1561 "rule" => array(
1562 "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1563 ),
1564 "uri" => ""
1565 ),
1566 "dontbuylists" => array(
1567 "icon" => "dontbuylists",
1568 "title" => "Dontbuylists",
1569 "rule" => array(
1570 "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1571 ),
1572 "uri" => "http://www.dontbuylists.com"
1573 ),
1574 "dotbot" => array(
1575 "icon" => "robot",
1576 "title" => "DotBot",
1577 "rule" => array(
1578 "DotBot[ /]([0-9.]{1,10})" => "\\1"
1579 ),
1580 "uri" => "http://www.dotnetdotcom.org"
1581 ),
1582 "doweb" => array( // DoWeb: user agent begins with the site's host name
1583 "icon" => "doweb",
1584 "title" => "DoWeb",
1585 "rule" => array(
1586 "^www\.doweb\.co\.uk" => "" // dots escaped so they match a literal "." only; no version captured
1587 ),
1588 "uri" => "http://www.doweb.co.uk/"
1589 ),
1590 "downforeveryoneorjustme" => array(
1591 "icon" => "downforeveryoneorjustme",
1592 "title" => "Down for everyone or just me",
1593 "rule" => array(
1594 "downforeveryoneorjustme" => ""
1595 ),
1596 "uri" => "http://www.downforeveryoneorjustme.com"
1597 ),
1598 "downloadninja" => array(
1599 "icon" => "robot",
1600 "title" => "Download Ninja",
1601 "rule" => array(
1602 "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1603 ),
1604 "uri" => ""
1605 ),
1606 "drupal" => array(
1607 "icon" => "drupal",
1608 "title" => "Drupal",
1609 "rule" => array(
1610 "^Drupal" => ""
1611 ),
1612 "uri" => ""
1613 ),
1614 "dsns" => array(
1615 "icon" => "robot",
1616 "title" => "DSNS Scanner",
1617 "rule" => array(
1618 "^DSNS" => ""
1619 ),
1620 "uri" => ""
1621 ),
1622 "dtsagent" => array(
1623 "icon" => "robot",
1624 "title" => "DTS Agent",
1625 "rule" => array(
1626 "DTS Agent" => ""
1627 ),
1628 "uri" => ""
1629 ),
1630 "earthcom" => array(
1631 "icon" => "earthcom",
1632 "title" => "Earthcom",
1633 "rule" => array(
1634 "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1635 ),
1636 "uri" => ""
1637 ),
1638 "ebay" => array(
1639 "icon" => "ebay",
1640 "title" => "eBay",
1641 "rule" => array(
1642 "eBay Relevance Ad Crawler" => ""
1643 ),
1644 "uri" => ""
1645 ),
1646 "echo" => array(
1647 "icon" => "robot",
1648 "title" => "Echo.com",
1649 "rule" => array(
1650 "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1651 ),
1652 "uri" => "http://www.echo.com/"
1653 ),
1654 "eert" => array(
1655 "icon" => "robot",
1656 "title" => "Eert",
1657 "rule" => array(
1658 "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1659 ),
1660 "uri" => "http://bot.eert.net"
1661 ),
1662 "eknip" => array(
1663 "icon" => "eknip",
1664 "title" => "E-Knip",
1665 "rule" => array(
1666 "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1667 ),
1668 "uri" => ""
1669 ),
1670 "zoominfo" => array(
1671 "icon" => "zoominfo",
1672 "title" => "ZoomInfo", // Previously called Eliyon
1673 "rule" => array(
1674 "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1675 ),
1676 "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1677 ),
1678 "emeraldshield" => array(
1679 "icon" => "emeraldshield",
1680 "title" => "EmeraldShield",
1681 "rule" => array(
1682 "^EmeraldShield" => ""
1683 ),
1684 "uri" => ""
1685 ),
1686 "empas" => array(
1687 "icon" => "empas",
1688 "title" => "Empas",
1689 "rule" => array(
1690 "DigExt; empas\)$" => "",
1691 "^EMPAS[_\-]ROBOT" => ""
1692 ),
1693 "uri" => ""
1694 ),
1695 "entireweb" => array(
1696 "icon" => "entireweb",
1697 "title" => "Entireweb",
1698 "rule" => array(
1699 "Speedy[ ]?Spider" => ""
1700 ),
1701 "uri" => ""
1702 ),
1703 "envolk" => array(
1704 "icon" => "envolk",
1705 "title" => "Envolk",
1706 "rule" => array(
1707 "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1708 "envolk[/ ]([0-9.]{1,10})" => "\\1"
1709 ),
1710 "uri" => ""
1711 ),
1712 "esnet" => array(
1713 "icon" => "robot",
1714 "title" => "ES.NET",
1715 "rule" => array(
1716 "ES.NET Crawler[ /]([0-9.]{1,10})" => "\\1"
1717 ),
1718 "uri" => ""
1719 ),
1720 "estyle" => array(
1721 "icon" => "estyle",
1722 "title" => "eStyle Search",
1723 "rule" => array(
1724 "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1725 ),
1726 "uri" => ""
1727 ),
1728 "eurip" => array(
1729 "icon" => "robot",
1730 "title" => "Eurip",
1731 "rule" => array(
1732 "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1733 ),
1734 "uri" => "http://www.eurip.com"
1735 ),
1736 "eurodirectory" => array(
1737 "icon" => "robot",
1738 "title" => "Euro Directory",
1739 "rule" => array(
1740 "www\.euro-directory\.com" => ""
1741 ),
1742 "uri" => "http://www.euro-directory.com/"
1743 ),
1744 "euroseek" => array(
1745 "icon" => "euroseek",
1746 "title" => "EuroSeek",
1747 "rule" => array(
1748 "Arachnoidea" => ""
1749 ),
1750 "uri" => ""
1751 ),
1752 "evaal" => array(
1753 "icon" => "evaal",
1754 "title" => "Evaal",
1755 "rule" => array(
1756 "^EvaalSE" => ""
1757 ),
1758 "uri" => "http://www.evaal.com/"
1759 ),
1760 "eventax" => array(
1761 "icon" => "eventax",
1762 "title" => "Eventax",
1763 "rule" => array(
1764 "^eventax[ /]([0-9.]{1,10})" => "\\1"
1765 ),
1766 "uri" => "http://www.eventax.de/"
1767 ),
1768 "everbee" => array(
1769 "icon" => "everbee",
1770 "title" => "Everbee",
1771 "rule" => array(
1772 "EverbeeCrawler" => ""
1773 ),
1774 "uri" => ""
1775 ),
1776 "everest" => array(
1777 "icon" => "everest",
1778 "title" => "Everest",
1779 "rule" => array(
1780 "Everest-Vulcan Inc.[ /]([0-9.]{1,10})" => "\\1"
1781 ),
1782 "uri" => ""
1783 ),
1784 "exabot" => array(
1785 "icon" => "exabot",
1786 "title" => "ExaBot",
1787 "rule" => array(
1788 "^NG[ /]([0-9.]{1,10})" => "\\1",
1789 "Exabot/([0-9.]{1,10})" => "\\1",
1790 "ExaBotTest/([0-9.]{1,10})" => "\\1",
1791 "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1792 "ExaBot-Thumbnails" => ""
1793 ),
1794 "uri" => "http://www.exabot.com/go/robot"
1795 ),
1796 "exactseek" => array(
1797 "icon" => "exactseek",
1798 "title" => "ExactSeek",
1799 "rule" => array(
1800 "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1801 "ExactSeek[ \.\-]?(Crawler|com)" => ""
1802 ),
1803 "uri" => "http://www.exactseek.com/"
1804 ),
1805 "excite" => array(
1806 "icon" => "excite",
1807 "title" => "Excite",
1808 "rule" => array(
1809 "Architext[ \-]?Spider" => ""
1810 ),
1811 "uri" => ""
1812 ),
1813 "execrawl" => array(
1814 "icon" => "robot",
1815 "title" => "Execrawl",
1816 "rule" => array(
1817 "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1818 "Execrawl" => ""
1819 ),
1820 "uri" => ""
1821 ),
1822 "expertmonitor" => array(
1823 "icon" => "robot",
1824 "title" => "ExpertMonitor",
1825 "rule" => array(
1826 "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1827 ),
1828 "uri" => ""
1829 ),
1830 "explorerrss" => array(
1831 "icon" => "robot",
1832 "title" => "Explorer RSS",
1833 "rule" => array(
1834 "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1835 ),
1836 "uri" => ""
1837 ),
1838 "ezooms" => array(
1839 "icon" => "robot",
1840 "title" => "Ezooms",
1841 "rule" => array(
1842 "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1843 ),
1844 "uri" => ""
1845 ),
1846 "facebook" => array(
1847 "icon" => "facebook",
1848 "title" => "Facebook",
1849 "rule" => array(
1850 "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1851 "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1852 "^facebook" => ""
1853 ),
1854 "uri" => "http://www.facebook.com/"
1855 ),
1856 "fast" => array(
1857 "icon" => "fast",
1858 "title" => "Fast",
1859 "rule" => array(
1860 "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1861 "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1862 "^Fast Crawler" => "",
1863 "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1864 ),
1865 "uri" => "http://www.alltheweb.com/"
1866 ),
1867 "fastbuzz" => array(
1868 "icon" => "fastbuzz",
1869 "title" => "Fastbuzz",
1870 "rule" => array(
1871 "^fastbuzz\.com" => ""
1872 ),
1873 "uri" => ""
1874 ),
1875 "favorg" => array(
1876 "icon" => "robot",
1877 "title" => "FavOrg",
1878 "rule" => array(
1879 "^FavOrg" => ""
1880 ),
1881 "uri" => ""
1882 ),
1883 "favorstar" => array(
1884 "icon" => "favorstar",
1885 "title" => "Favorstar",
1886 "rule" => array(
1887 "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1888 ),
1889 "uri" => "http://favorstar.com/bot.html"
1890 ),
1891 "faxo" => array(
1892 "icon" => "robot",
1893 "title" => "Faxo",
1894 "rule" => array(
1895 "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1896 ),
1897 "uri" => "http://www.faxo.com/"
1898 ),
1899 "fdse" => array(
1900 "icon" => "robot",
1901 "title" => "FDSE Robot",
1902 "rule" => array(
1903 "FDSE[ \-]?robot" => ""
1904 ),
1905 "uri" => ""
1906 ),
1907 "feedback" => array(
1908 "icon" => "robot",
1909 "title" => "FeedBack",
1910 "rule" => array(
1911 "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1912 ),
1913 "uri" => ""
1914 ),
1915 "feedburner" => array(
1916 "icon" => "feedburner",
1917 "title" => "FeedBurner",
1918 "rule" => array(
1919 "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1920 ),
1921 "uri" => ""
1922 ),
1923 "feeddemon" => array(
1924 "icon" => "feeddemon",
1925 "title" => "FeedDemon",
1926 "rule" => array(
1927 "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1928 ),
1929 "uri" => ""
1930 ),
1931 "feedfind" => array(
1932 "icon" => "feedfind",
1933 "title" => "FeedFind",
1934 "rule" => array(
1935 "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1936 ),
1937 "uri" => ""
1938 ),
1939 "feedonfeeds" => array(
1940 "icon" => "robot",
1941 "title" => "Feed On Feeds",
1942 "rule" => array(
1943 "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1944 ),
1945 "uri" => ""
1946 ),
1947 "feedparser" => array(
1948 "icon" => "robot",
1949 "title" => "Feedparser",
1950 "rule" => array(
1951 "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1952 "FeedParser" => ""
1953 ),
1954 "uri" => ""
1955 ),
1956 "feedreader" => array(
1957 "icon" => "feedreader",
1958 "title" => "Feedreader",
1959 "rule" => array(
1960 "^Feedreader" => ""
1961 ),
1962 "uri" => ""
1963 ),
1964 "feedserver" => array(
1965 "icon" => "robot",
1966 "title" => "FeedServer",
1967 "rule" => array(
1968 "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
1969 ),
1970 "uri" => ""
1971 ),
1972 "feedster" => array(
1973 "icon" => "feedster",
1974 "title" => "Feedster",
1975 "rule" => array(
1976 "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
1977 ),
1978 "uri" => ""
1979 ),
1980 "feedvalidator" => array(
1981 "icon" => "feedvalidator",
1982 "title" => "Feed Validator",
1983 "rule" => array(
1984 "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
1985 ),
1986 "uri" => ""
1987 ),
1988 "fdm" => array(
1989 "icon" => "robot",
1990 "title" => "Free Download Manager",
1991 "rule" => array(
1992 "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
1993 ),
1994 "uri" => ""
1995 ),
1996 "filangy" => array(
1997 "icon" => "robot",
1998 "title" => "Filangy",
1999 "rule" => array(
2000 "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2001 ),
2002 "uri" => "http://www.filangy.com/"
2003 ),
2004 "findanisp" => array(
2005 "icon" => "robot",
2006 "title" => "FindAnISP",
2007 "rule" => array(
2008 "FindAnISP" => ""
2009 ),
2010 "uri" => "http://www.findanisp.com/"
2011 ),
2012 "findengines" => array(
2013 "icon" => "findengines",
2014 "title" => "FindEngines",
2015 "rule" => array(
2016 "FindEngines! Bot" => ""
2017 ),
2018 "uri" => ""
2019 ),
2020 "findexa" => array(
2021 "icon" => "findexa",
2022 "title" => "Findexa",
2023 "rule" => array(
2024 "Findexa Crawler" => ""
2025 ),
2026 "uri" => ""
2027 ),
2028 "findlinks" => array(
2029 "icon" => "findlinks",
2030 "title" => "FindLinks",
2031 "rule" => array(
2032 "findlinks[ /]([0-9.]{1,10})" => "\\1",
2033 "^FindLinks" => ""
2034 ),
2035 "uri" => ""
2036 ),
2037 "findoor" => array( // Findoor: user agent begins with "findoor" or "findoor-Bot"
2038 "icon" => "findoor",
2039 "title" => "Findoor",
2040 "rule" => array(
2041 "^findoor(-Bot)?" => "" // the only group is the optional "-Bot" name suffix, not a version
2042 ),
2043 "uri" => ""
2044 ),
2045 "firefly" => array(
2046 "icon" => "firefly",
2047 "title" => "Firefly",
2048 "rule" => array(
2049 "Firefly" => ""
2050 ),
2051 "uri" => ""
2052 ),
2053 "flashget" => array(
2054 "icon" => "flashget",
2055 "title" => "FlashGet",
2056 "rule" => array(
2057 "^FlashGet" => ""
2058 ),
2059 "uri" => ""
2060 ),
2061 "flatland" => array(
2062 "icon" => "flatland",
2063 "title" => "Flatland",
2064 "rule" => array(
2065 "^flatlandbot" => ""
2066 ),
2067 "uri" => "http://www.flatlandindustries.com/flatlandbot"
2068 ),
2069 "flickbot" => array(
2070 "icon" => "flickbot",
2071 "title" => "FlickBot",
2072 "rule" => array(
2073 "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2074 ),
2075 "uri" => ""
2076 ),
2077 "flightdeckreports" => array(
2078 "icon" => "flightdeckreports",
2079 "title" => "Flight Deck Reports",
2080 "rule" => array(
2081 "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2082 ),
2083 "uri" => "http://www.flightdeckreports.com/"
2084 ),
2085 "forex" => array(
2086 "icon" => "robot",
2087 "title" => "Forex",
2088 "rule" => array(
2089 "^Forex Trading Network Organization" => ""
2090 ),
2091 "uri" => "http://www.netforex.org/"
2092 ),
2093 "freshmeat" => array(
2094 "icon" => "freshmeat",
2095 "title" => "Freshmeat",
2096 "rule" => array(
2097 "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2098 "freshmeat.net URL validator[ /]([0-9.]{1,10})" => "\\1"
2099 ),
2100 "uri" => "http://www.freshmeat.net/"
2101 ),
2102 "friend" => array(
2103 "icon" => "friend",
2104 "title" => "Friend",
2105 "rule" => array(
2106 "www\.friend\.fr" => ""
2107 ),
2108 "uri" => "http://www.friend.fr/"
2109 ),
2110 "frontier" => array(
2111 "icon" => "frontier",
2112 "title" => "Frontier",
2113 "rule" => array(
2114 "Frontier[ /]([0-9.]{1,10})" => "\\1"
2115 ),
2116 "uri" => ""
2117 ),
2118 "fyberspider" => array(
2119 "icon" => "robot",
2120 "title" => "FyberSpider",
2121 "rule" => array(
2122 "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2123 ),
2124 "uri" => "http://www.fyberspider.com/"
2125 ),
2126 "gaisbot" => array(
2127 "icon" => "gais",
2128 "title" => "Gaisbot",
2129 "rule" => array(
2130 "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2131 ),
2132 "uri" => ""
2133 ),
2134 "galaxy" => array( // Galaxy: matched by bot name (with version) or by the site's host name
2135 "icon" => "galaxy",
2136 "title" => "Galaxy",
2137 "rule" => array(
2138 "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2139 "www\.galaxy\.com" => "" // dots escaped so they match a literal "." only; no version captured
2140 ),
2141 "uri" => "http://www.galaxy.com/"
2142 ),
2143 "gamespy" => array(
2144 "icon" => "gamespy",
2145 "title" => "GameSpy",
2146 "rule" => array(
2147 "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2148 ),
2149 "uri" => ""
2150 ),
2151 "garlik" => array(
2152 "icon" => "garlik",
2153 "title" => "Garlik",
2154 "rule" => array(
2155 "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2156 ),
2157 "uri" => "http://garlik.com/"
2158 ),
2159 "gdesktop" => array(
2160 "icon" => "gdesktop",
2161 "title" => "Google Desktop",
2162 "rule" => array(
2163 "compatible; Google Desktop" => ""
2164 ),
2165 "uri" => ""
2166 ),
2167 "genome" => array(
2168 "icon" => "robot",
2169 "title" => "Genome Machine",
2170 "rule" => array(
2171 "Genome[ \-]?Machine" => ""
2172 ),
2173 "uri" => ""
2174 ),
2175 "geohash" => array(
2176 "icon" => "geohash",
2177 "title" => "Geohash",
2178 "rule" => array(
2179 "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2180 ),
2181 "uri" => "http://geohash.org/"
2182 ),
2183 "geona" => array(
2184 "icon" => "robot",
2185 "title" => "Geona",
2186 "rule" => array(
2187 "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2188 ),
2189 "uri" => ""
2190 ),
2191 "geoblog" => array(
2192 "icon" => "robot",
2193 "title" => "The World as a Blog",
2194 "rule" => array(
2195 "The World as a Blog" => ""
2196 ),
2197 "uri" => ""
2198 ),
2199 "geourl" => array(
2200 "icon" => "geourl",
2201 "title" => "GeoUrl",
2202 "rule" => array(
2203 "geourl[ /]([0-9.]{1,10})" => "\\1",
2204 "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2205 ),
2206 "uri" => ""
2207 ),
2208 "getnetwise" => array(
2209 "icon" => "robot",
2210 "title" => "GetNetWise",
2211 "rule" => array(
2212 " Crayon Crawler" => ""
2213 ),
2214 "uri" => ""
2215 ),
2216 "getright" => array(
2217 "icon" => "getright",
2218 "title" => "GetRight",
2219 "rule" => array(
2220 "GetRight[ /]([0-9.]{1,10})" => "\\1"
2221 ),
2222 "uri" => ""
2223 ),
2224 "getsmart" => array(
2225 "icon" => "getsmart",
2226 "title" => "GetSmart",
2227 "rule" => array(
2228 "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2229 ),
2230 "uri" => ""
2231 ),
2232 "gigabot" => array(
2233 "icon" => "gigablast",
2234 "title" => "Gigablast",
2235 "rule" => array(
2236 "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2237 "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2238 ),
2239 "uri" => ""
2240 ),
2241 "gimme" => array(
2242 "icon" => "gimme",
2243 "title" => "gimmeUSA",
2244 "rule" => array(
2245 "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2246 ),
2247 "uri" => "http://gimme60.com"
2248 ),
2249 "ginger" => array(
2250 "icon" => "ginger",
2251 "title" => "GingerCrawler",
2252 "rule" => array(
2253 "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2254 ),
2255 "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2256 ),
2257 "girafabot" => array(
2258 "icon" => "girafa",
2259 "title" => "Girafa",
2260 "rule" => array(
2261 "Girafabot" => ""
2262 ),
2263 "uri" => ""
2264 ),
2265 "globalspec" => array(
2266 "icon" => "globalspec",
2267 "title" => "GlobalSpec",
2268 "rule" => array(
2269 "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2270 ),
2271 "uri" => ""
2272 ),
2273 "glucose" => array(
2274 "icon" => "glucose",
2275 "title" => "Glucose",
2276 "rule" => array(
2277 "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2278 ),
2279 "uri" => ""
2280 ),
2281 "gnomit" => array(
2282 "icon" => "gnomit",
2283 "title" => "Gnomit",
2284 "rule" => array(
2285 "gnomit[ /]([0-9.]{1,10})" => "\\1"
2286 ),
2287 "uri" => "http://www.gnomit.com/",
2288 ),
2289 "goforit" => array(
2290 "icon" => "goforit",
2291 "title" => "GoForIt",
2292 "rule" => array(
2293 "^GoForIt\.com" => "",
2294 "^GOFORITBOT" => ""
2295 ),
2296 "uri" => ""
2297 ),
2298 "goguides" => array(
2299 "icon" => "robot",
2300 "title" => "GoGuides",
2301 "rule" => array(
2302 "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2303 ),
2304 "uri" => "http://www.goguides.org/"
2305 ),
2306 // Needs to be before google for correct detection
2307 "mediapartners" => array(
2308 "icon" => "google",
2309 "title" => "Mediapartners",
2310 "rule" => array (
2311 "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2312 "Mediapartners-Google" => ""
2313 ),
2314 "uri" => ""
2315 ),
2316 "google" => array(
2317 "icon" => "google",
2318 "title" => "Google",
2319 "rule" => array (
2320 "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2321 "Googl(e|ebot)(-Image)?/" => "",
2322 "^gsa-crawler" => "",
2323 "Google Web Preview" => ""
2324 ),
2325 "uri" => "http://www.google.com/"
2326 ),
2327 "googlesitemaps" => array(
2328 "icon" => "google",
2329 "title" => "Google-Sitemaps",
2330 "rule" => array (
2331 "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2332 "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2333 "Googl(e|ebot)(-Sitemaps)?/" => ""
2334 ),
2335 "uri" => ""
2336 ),
2337 "googlemobile" => array(
2338 "icon" => "google",
2339 "title" => "Google-Mobile",
2340 "rule" => array (
2341 "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2342 "Googl(e|ebot)(-Mobile)?/" => ""
2343 ),
2344 "uri" => ""
2345 ),
2346 "googleads" => array(
2347 "icon" => "google",
2348 "title" => "Google-AdsBot",
2349 "rule" => array (
2350 "^AdsBot-Google" => "",
2351 ),
2352 "uri" => ""
2353 ),
2354 "googlefeeds" => array(
2355 "icon" => "google",
2356 "title" => "Google-Feedfetcher",
2357 "rule" => array (
2358 "^Feedfetcher-Google" => "",
2359 ),
2360 "uri" => ""
2361 ),
2362 "googlverification" => array(
2363 "icon" => "google",
2364 "title" => "Google-Site-Verification",
2365 "rule" => array (
2366 "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2367 ),
2368 "uri" => ""
2369 ),
2370 // Needs to be AFTER Google detection
2371 "goo" => array(
2372 "icon" => "goo",
2373 "title" => "Goo",
2374 "rule" => array (
2375 "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2376 "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2377 ),
2378 "uri" => ""
2379 ),
2380 "goongee" => array( // GoonGee: user agent begins with "Big Fish"
2381 "icon" => "robot",
2382 "title" => "GoonGee",
2383 "rule" => array (
2384 "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // the version is the pattern's only capture group
2385 ),
2386 "uri" => "http://www.goongee.com/"
2387 ),
2388 "gpost" => array(
2389 "icon" => "gpost",
2390 "title" => "GPost",
2391 "rule" => array(
2392 "^GPostbot" => ""
2393 ),
2394 "uri" => ""
2395 ),
2396 "grapeshot" => array(
2397 "icon" => "grapeshot",
2398 "title" => "Grapeshot",
2399 "rule" => array(
2400 "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2401 ),
2402 "uri" => "http://www.grapeshot.co.uk/crawler.php"
2403 ),
2404 "gregarius" => array( // Gregarius: user agent begins with "Gregarius" followed by a version
2405 "icon" => "robot",
2406 "title" => "Gregarius",
2407 "rule" => array(
2408 "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
2409 ),
2410 "uri" => ""
2411 ),
2412 "grub" => array(
2413 "icon" => "grub",
2414 "title" => "Grub",
2415 "rule" => array(
2416 "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2417 "grub crawler" => "",
2418 "grub[/ ]([0-9.]{1,10})" => "\\1",
2419 "^GrubNG([0-9. ]{1,10})?" => "\\1"
2420 ),
2421 "uri" => "http://www.grub.org/"
2422 ),
2423 "gulliver" => array(
2424 "icon" => "robot",
2425 "title" => "Gulliver",
2426 "rule" => array(
2427 "Gulliver" => ""
2428 ),
2429 "uri" => ""
2430 ),
2431 "guruji" => array(
2432 "icon" => "guruji",
2433 "title" => "Guruji",
2434 "rule" => array(
2435 "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2436 ),
2437 "uri" => "http://www.guruji.com/"
2438 ),
2439 "gush" => array(
2440 "icon" => "robot",
2441 "title" => "Gush",
2442 "rule" => array(
2443 "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2444 ),
2445 "uri" => ""
2446 ),
2447 "gziptester" => array(
2448 "icon" => "robot",
2449 "title" => "Gzip Tester",
2450 "rule" => array(
2451 "g(id)?zip[ \-]?test(er)?" => ""
2452 ),
2453 "uri" => ""
2454 ),
2455 "hanzoweb" => array(
2456 "icon" => "hanzoweb",
2457 "title" => "Hanzoweb",
2458 "rule" => array(
2459 "^Hanzoweb" => ""
2460 ),
2461 "uri" => ""
2462 ),
2463 "harbot" => array(
2464 "icon" => "harbot",
2465 "title" => "Harbot",
2466 "rule" => array(
2467 "^Harbot GateStation" => ""
2468 ),
2469 "uri" => ""
2470 ),
2471 "hatena" => array(
2472 "icon" => "hatena",
2473 "title" => "Hatena",
2474 "rule" => array(
2475 "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2476 ),
2477 "uri" => ""
2478 ),
2479 "htmlparser" => array(
2480 "icon" => "htmlparser",
2481 "title" => "HTMLParser",
2482 "rule" => array(
2483 "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2484 ),
2485 "uri" => "http://htmlparser.sourceforge.net/"
2486 ),
2487 "helix" => array( // Helix: user agent begins with "helix" followed by a version
2488 "icon" => "helix",
2489 "title" => "Helix", // own title, matching this entry's key, icon, rule and uri
2490 "rule" => array(
2491 "^helix[ /]([0-9.]{1,10})" => "\\1"
2492 ),
2493 "uri" => "http://www.sitesearch.ca/helix/"
2494 ),
2495 "heritrix" => array(
2496 "icon" => "heritrix",
2497 "title" => "Heritrix",
2498 "rule" => array(
2499 "heritrix[ /]([0-9.]{1,10})" => "\\1",
2500 "archive.org_bot" => "",
2501 "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2502 ),
2503 "uri" => "http://archive.org"
2504 ),
2505 "hiddenmarket" => array(
2506 "icon" => "robot",
2507 "title" => "HiddenMarket",
2508 "rule" => array(
2509 "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2510 ),
2511 "uri" => ""
2512 ),
2513 "honda" => array(
2514 "icon" => "robot",
2515 "title" => "Honda",
2516 "rule" => array(
2517 "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2518 ),
2519 "uri" => "http://www.honda-search.com"
2520 ),
2521 "hoowwwer" => array(
2522 "icon" => "hoowwwer",
2523 "title" => "HooWWWer",
2524 "rule" => array(
2525 "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2526 ),
2527 "uri" => ""
2528 ),
2529 "hotzonu" => array(
2530 "icon" => "hotzonu",
2531 "title" => "Hotzonu",
2532 "rule" => array(
2533 "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2534 ),
2535 "uri" => ""
2536 ),
2537 "houxou" => array(
2538 "icon" => "robot",
2539 "title" => "Houxou",
2540 "rule" => array(
2541 "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2542 "HouxouCrawler" => ""
2543 ),
2544 "uri" => ""
2545 ),
2546 "htdig" => array( // ht://Dig: versioned rule first, bare-name fallback second
2547 "icon" => "htdig",
2548 "title" => "ht://Dig",
2549 "rule" => array(
2550 "htdig[ /]([0-9.]{1,10})" => "\\1",
2551 "htdig" => "" // fallback has no capture group, so there is no version to report
2552 ),
2553 "uri" => ""
2554 ),
2555 "html2jpg" => array(
2556 "icon" => "html2jpg",
2557 "title" => "HTML2JPG",
2558 "rule" => array(
2559 "^HTML2JPG" => ""
2560 ),
2561 "uri" => ""
2562 ),
2563 "httperf" => array(
2564 "icon" => "robot",
2565 "title" => "HTTPerf",
2566 "rule" => array(
2567 "httperf[ /]([0-9.]{1,10})" => "\\1"
2568 ),
2569 "uri" => ""
2570 ),
2571 "httpunit" => array(
2572 "icon" => "httpunit",
2573 "title" => "HttpUnit",
2574 "rule" => array(
2575 "httpunit[ /]([0-9.]{1,10})" => "\\1"
2576 ),
2577 "uri" => ""
2578 ),
2579 "httrack" => array(
2580 "icon" => "httrack",
2581 "title" => "HTTrack",
2582 "rule" => array(
2583 "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2584 ),
2585 "uri" => ""
2586 ),
2587 "huaweisymantec" => array(
2588 "icon" => "huaweisymantec",
2589 "title" => "HuaweiSymantec",
2590 "rule" => array(
2591 "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2592 ),
2593 "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2594 ),
2595 "hungary" => array(
2596 "icon" => "hungary",
2597 "title" => "Hungary",
2598 "rule" => array(
2599 "HuRob[ /]([0-9.]{1,10})" => "\\1"
2600 ),
2601 "uri" => ""
2602 ),
2603 "i18n" => array(
2604 "icon" => "w3c",
2605 "title" => "W3C I18n Checker",
2606 "rule" => array(
2607 "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2608 ),
2609 "uri" => "http://validator.w3.org/services"
2610 ),
2611 "iakke" => array(
2612 "icon" => "iakke",
2613 "title" => "Iakké",
2614 "rule" => array(
2615 "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2616 ),
2617 "uri" => "http://fr.iakke.com/"
2618 ),
2619 "iask" => array(
2620 "icon" => "iask",
2621 "title" => "IAsk",
2622 "rule" => array(
2623 "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2624 "^iaskspider" => ""
2625 ),
2626 "uri" => "http://iask.com"
2627 ),
2628 "icc" => array(
2629 "icon" => "icc",
2630 "title" => "ICC-Crawler",
2631 "rule" => array(
2632 "^ICC-Crawler" => ""
2633 ),
2634 "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2635 ),
2636 "icerocket" => array(
2637 "icon" => "icerocket",
2638 "title" => "Icerocket",
2639 "rule" => array(
2640 "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2641 "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2642 ),
2643 "uri" => ""
2644 ),
2645 "icjobs" => array(
2646 "icon" => "icjobs",
2647 "title" => "iCjobs",
2648 "rule" => array(
2649 "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2650 ),
2651 "uri" => "http://www.icjobs.de/"
2652 ),
2653 "icra" => array(
2654 "icon" => "icra",
2655 "title" => "ICRA",
2656 "rule" => array(
2657 "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2658 ),
2659 "uri" => "http://www.icra.org"
2660 ),
2661 "iknow" => array(
2662 "icon" => "robot",
2663 "title" => "I know",
2664 "rule" => array(
2665 "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2666 ),
2667 "uri" => ""
2668 ),
2669 "ilial" => array(
2670 "icon" => "robot",
2671 "title" => "Ilial",
2672 "rule" => array(
2673 "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2674 ),
2675 "uri" => ""
2676 ),
2677 "ilocal" => array(
2678 "icon" => "ilocal",
2679 "title" => "ilocal",
2680 "rule" => array(
2681 "^ilocal" => "",
2682 ),
2683 "uri" => "http://www.ilocal.nl"
2684 ),
2685 "ilse" => array( // Ilse: matches INGRID, IlseRobot or IlseBot followed by a version
2686 "icon" => "ilse",
2687 "title" => "Ilse",
2688 "rule" => array(
2689 "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the name alternation, group 2 the version
2690 ),
2691 "uri" => "http://ilse.nl/"
2692 ),
2693 "iltrovatore" => array(
2694 "icon" => "iltrovatore",
2695 "title" => "IlTrovatore",
2696 "rule" => array(
2697 "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2698 "Iltrovatore-Setaccio" => "",
2699 "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2700 ),
2701 "uri" => ""
2702 ),
2703 "indylibrary" => array(
2704 "icon" => "robot",
2705 "title" => "Indy Library",
2706 "rule" => array(
2707 "Indy[ \-]?Library" => ""
2708 ),
2709 "uri" => ""
2710 ),
2711 "inela" => array( // Inela: matches "InelaBot" followed by a version
2712 "icon" => "robot",
2713 "title" => "Inela",
2714 "rule" => array(
2715 "InelaBot[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
2716 ),
2717 "uri" => "http://inelegant.org/bot"
2718 ),
2719 "ineturl" => array(
2720 "icon" => "robot",
2721 "title" => "InetURL",
2722 "rule" => array(
2723 "InetURL.?[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
2724 ),
2725 "uri" => ""
2726 ),
2727 "infoart" => array(
2728 "icon" => "robot",
2729 "title" => "InfoArt",
2730 "rule" => array(
2731 "InfoArt crawler" => ""
2732 ),
2733 "uri" => ""
2734 ),
2735 "infomine" => array(
2736 "icon" => "infomine",
2737 "title" => "INFOMINE",
2738 "rule" => array(
2739 "^DataFountains/DMOZ" => "",
2740 "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2741 ),
2742 "uri" => "http://infomine.ucr.edu/"
2743 ),
2744 "infoseek" => array(
2745 "icon" => "infoseek",
2746 "title" => "Infoseek",
2747 "rule" => array(
2748 "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2749 "Infoseek" => ""
2750 ),
2751 "uri" => ""
2752 ),
2753 "inktomi" => array(
2754 "icon" => "inktomi",
2755 "title" => "Inktomi",
2756 "rule" => array(
2757 "slurp@inktomi\.com" => ""
2758 ),
2759 "uri" => ""
2760 ),
2761 "innerprise" => array(
2762 "icon" => "robot",
2763 "title" => "Innerprise",
2764 "rule" => array(
2765 "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2766 "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2767 "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2768 ),
2769 "uri" => "http://www.innerprise.com/"
2770 ),
2771 "inria" => array(
2772 "icon" => "inria",
2773 "title" => "Inria",
2774 "rule" => array(
2775 "^xyro_" => ""
2776 ),
2777 "uri" => ""
2778 ),
2779 "insitor" => array(
2780 "icon" => "insitor",
2781 "title" => "Insitor",
2782 "rule" => array(
2783 "^Insitor(,|\.|naut)" => ""
2784 ),
2785 "uri" => "http://www.insitor.com/"
2786 ),
2787 "internetninja" => array(
2788 "icon" => "robot",
2789 "title" => "Internet Ninja",
2790 "rule" => array(
2791 "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2792 ),
2793 "uri" => ""
2794 ),
2795 "internetseer" => array(
2796 "icon" => "internetseer",
2797 "title" => "InternetSeer",
2798 "rule" => array(
2799 "^InternetSeer\.com" => ""
2800 ),
2801 "uri" => ""
2802 ),
2803 "interseek" => array(
2804 "icon" => "interseek",
2805 "title" => "Interseek",
2806 "rule" => array(
2807 "Interseek.com" => ""
2808 ),
2809 "uri" => "http://www.interseek.com"
2810 ),
2811 "intravnews" => array(
2812 "icon" => "intravnews",
2813 "title" => "IntraVnews",
2814 "rule" => array(
2815 "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2816 ),
2817 "uri" => "http://www.intravnews.com/"
2818 ),
2819 "ip2location" => array(
2820 "icon" => "ip2location",
2821 "title" => "IP2LocationBot",
2822 "rule" => array(
2823 "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2824 ),
2825 "uri" => "http://www.ip2location.com"
2826 ),
2827 "ipworks" => array(
2828 "icon" => "ipworks",
2829 "title" => "IP*Works",
2830 "rule" => array(
2831 "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2832 ),
2833 "uri" => "http://www.nsoftware.com/ipworks/"
2834 ),
2835 "irca" => array(
2836 "icon" => "robot",
2837 "title" => "Novell iChain Cool Solutions caching",
2838 "rule" => array(
2839 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2", // NOTE(review): an ICRA user agent under a Novell iChain title; "^ICRA_Semantic_spider" is also matched by the "icra" entry - confirm which entry should own this rule
2840 "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1" // version reported is the Mozilla token's, captured in group 1
2841 ),
2842 "uri" => "http://www.icra.org" // NOTE(review): points at ICRA although the title names Novell iChain - confirm
2843 ),
2844 "irvine" => array(
2845 "icon" => "robot",
2846 "title" => "Irvine",
2847 "rule" => array(
2848 "Irvine[ /]([0-9.]{1,10})" => "\\1"
2849 ),
2850 "uri" => ""
2851 ),
2852 "ips-agent" => array(
2853 "icon" => "robot",
2854 "title" => "IPS-agent",
2855 "rule" => array(
2856 "ips-agent" => ""
2857 ),
2858 "uri" => ""
2859 ),
2860 "isara" => array(
2861 "icon" => "isara",
2862 "title" => "Isara",
2863 "rule" => array(
2864 "Isara[ -]([0-9.]{1,10})" => "\\1"
2865 ),
2866 "uri" => "http://www.isara.org/"
2867 ),
2868 "isspider" => array(
2869 "icon" => "robot",
2870 "title" => "ISSpider",
2871 "rule" => array(
2872 "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2873 ),
2874 "uri" => ""
2875 ),
2876 "it2media" => array(
2877 "icon" => "it2media",
2878 "title" => "IT2media",
2879 "rule" => array(
2880 "www.adressendeutschland.de" => ""
2881 ),
2882 "uri" => "http://www.adressendeutschland.de/"
2883 ),
2884 "ivia" => array(
2885 "icon" => "robot",
2886 "title" => "iVia",
2887 "rule" => array(
2888 "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2889 ),
2890 "uri" => ""
2891 ),
2892 "jeteye" => array(
2893 "icon" => "jeteye",
2894 "title" => "Jeteye",
2895 "rule" => array(
2896 "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2897 ),
2898 "uri" => ""
2899 ),
2900 "jobsde" => array(
2901 "icon" => "jobsde",
2902 "title" => "jobs.de",
2903 "rule" => array(
2904 "www\.jobs\.de" => "",
2905 "jobs.de-Robot" => ""
2906 ),
2907 "uri" => "http://www.jobs.de/"
2908 ),
2909 "jpluck" => array(
2910 "icon" => "robot",
2911 "title" => "Jpluck",
2912 "rule" => array(
2913 "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2914 ),
2915 "uri" => ""
2916 ),
2917 "jxta" => array(
2918 "icon" => "robot",
2919 "title" => "Jxta",
2920 "rule" => array(
2921 "falcon[ /]([0-9.]{1,10})" => "\\1"
2922 ),
2923 "uri" => ""
2924 ),
2925 "jyte" => array(
2926 "icon" => "jyte",
2927 "title" => "Jyte",
2928 "rule" => array(
2929 "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2930 ),
2931 "uri" => ""
2932 ),
2933 "jyxo" => array(
2934 "icon" => "jyxo",
2935 "title" => "Jyxo",
2936 "rule" => array(
2937 "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2938 ),
2939 "uri" => ""
2940 ),
2941 "kalooga" => array(
2942 "icon" => "kalooga",
2943 "title" => "Kalooga",
2944 "rule" => array(
2945 "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2946 "^kalooga" => "",
2947 "KaloogaBot" => ""
2948 ),
2949 "uri" => "http://www.kalooga.com"
2950 ),
2951 "keywen" => array(
2952 "icon" => "keywen",
2953 "title" => "Keywen",
2954 "rule" => array(
2955 "EasyDL[ /]([0-9.]{1,10})" => "\\1"
2956 ),
2957 "uri" => ""
2958 ),
2959 "kilomonkey" => array(
2960 "icon" => "robot",
2961 "title" => "Kilomonkey",
2962 "rule" => array(
2963 "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
2964 ),
2965 "uri" => "http://www.kilomonkey.com/notabot.txt"
2966 ),
2967 "kinja" => array(
2968 "icon" => "kinja",
2969 "title" => "Kinja",
2970 "rule" => array(
2971 "kinjabot[ /]([0-9.]{1,10})" => "\\1",
2972 "^kinjabot" => ""
2973 ),
2974 "uri" => ""
2975 ),
2976 "kiwi" => array(
2977 "icon" => "robot",
2978 "title" => "KiwiStatus",
2979 "rule" => array(
2980 "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
2981 "KiwiStatus" => ""
2982 ),
2983 "uri" => "http://www.nzs.com/kiei-status/"
2984 ),
2985 "lachesis" => array(
2986 "icon" => "robot",
2987 "title" => "Lachesis",
2988 "rule" => array(
2989 "lachesis" => ""
2990 ),
2991 "uri" => ""
2992 ),
2993 "lanshan" => array(
2994 "icon" => "robot",
2995 "title" => "Lanshan", // title now names the bot matched by the lanshanbot rule below
2996 "rule" => array(
2997 "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
2998 ),
2999 "uri" => ""
3000 ),
3001 "lapozz" => array(
3002 "icon" => "lapozz",
3003 "title" => "Lapozz",
3004 "rule" => array(
3005 "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3006 ),
3007 "uri" => ""
3008 ),
3009 "larbin" => array(
3010 "icon" => "robot",
3011 "title" => "Larbin",
3012 "rule" => array(
3013 "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3014 ),
3015 "uri" => ""
3016 ),
3017 "laurion" => array(
3018 "icon" => "robot",
3019 "title" => "Laurion",
3020 "rule" => array(
3021 "^IPiumBot" => ""
3022 ),
3023 "uri" => "http://www.laurion.com/"
3024 ),
3025 "leechget" => array(
3026 "icon" => "leechget",
3027 "title" => "LeechGet",
3028 "rule" => array(
3029 "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3030 ),
3031 "uri" => ""
3032 ),
3033 "linguaseek" => array(
3034 "icon" => "linguaseek",
3035 "title" => "Linguaseek",
3036 "rule" => array(
3037 "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3038 ),
3039 "uri" => "http://www.linguaseek.com/"
3040 ),
3041 "linguee" => array(
3042 "icon" => "linguee",
3043 "title" => "Linguee",
3044 "rule" => array(
3045 "^Linguee Bot" => ""
3046 ),
3047 "uri" => "http://www.linguee.com/"
3048 ),
3049 "linkguard" => array(
3050 "icon" => "robot",
3051 "title" => "Linkguard",
3052 "rule" => array(
3053 "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3054 ),
3055 "uri" => "http://www.linkguard.com/"
3056 ),
3057 "linklint" => array(
3058 "icon" => "linklint",
3059 "title" => "Linklint",
3060 "rule" => array(
3061 "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3062 ),
3063 "uri" => "http://www.linklint.org/"
3064 ),
3065 "linkman" => array(
3066 "icon" => "linkman",
3067 "title" => "Linkman",
3068 "rule" => array(
3069 "\(compatible; Linkman\)" => ""
3070 ),
3071 "uri" => ""
3072 ),
3073 // Needs to be before linkcheck for correct detection
3074 "linkchecker" => array(
3075 "icon" => "w3c",
3076 "title" => "W3C Link Checker",
3077 "rule" => array(
3078 "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3079 ),
3080 "uri" => "http://validator.w3.org/checklink"
3081 ),
3082 "linkcheck" => array(
3083 "icon" => "linkcheck",
3084 "title" => "Linkcheck",
3085 "rule" => array(
3086 "checklink[ /]([0-9.]{1,10})" => "\\1",
3087 "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3088 "Adaxas Spider" => "",
3089 "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3090 "NetMechanic V([0-9.]{1,10})" => "\\1",
3091 "^InfoLink" => "",
3092 "InternetLinkAgent" => "",
3093 "; SPENG\)" => "",
3094 "SharewarePlazaFileCheckBot" => "",
3095 "fileboost.net" => "",
3096 "^billbot" => ""
3097 ),
3098 "uri" => ""
3099 ),
3100 "linkru" => array(
3101 "icon" => "robot",
3102 "title" => "Link.RU",
3103 "rule" => array(
3104 "^Link.RU bot" => ""
3105 ),
3106 "uri" => ""
3107 ),
3108 "linkssql" => array(
3109 "icon" => "robot",
3110 "title" => "Links SQL",
3111 "rule" => array(
3112 "links sql" => ""
3113 ),
3114 "uri" => ""
3115 ),
3116 "linksweeper" => array(
3117 "icon" => "robot",
3118 "title" => "Link Sweeper",
3119 "rule" => array(
3120 "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3121 ),
3122 "uri" => ""
3123 ),
3124 "linkwalker" => array(
3125 "icon" => "robot",
3126 "title" => "Link Walker",
3127 "rule" => array(
3128 "^LinkWalker" => ""
3129 ),
3130 "uri" => ""
3131 ),
3132 "lipperhey" => array(
3133 "icon" => "lipperhey",
3134 "title" => "Lipperhey",
3135 "rule" => array(
3136 "Lipperhey Spider" => ""
3137 ),
3138 "uri" => "http://www.lipperhey.com"
3139 ),
3140 "livedoor" => array(
3141 "icon" => "livedoor",
3142 "title" => "Livedoor",
3143 "rule" => array(
3144 "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3145 ),
3146 "uri" => ""
3147 ),
3148 "livejournal" => array(
3149 "icon" => "livejournal",
3150 "title" => "Live Journal",
3151 "rule" => array(
3152 "^LiveJournal\.com" => ""
3153 ),
3154 "uri" => "http://www.livejournal.com"
3155 ),
3156 "ljpic" => array(
3157 "icon" => "ljpic",
3158 "title" => "ljpic",
3159 "rule" => array(
3160 "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3161 ),
3162 "uri" => "http://www.ljpic.com"
3163 ),
3164 "lmspider" => array(
3165 "icon" => "robot",
3166 "title" => "Lmspider",
3167 "rule" => array(
3168 "^lmspider" => ""
3169 ),
3170 "uri" => ""
3171 ),
3172 "locators" => array(
3173 "icon" => "robot",
3174 "title" => "Locaters",
3175 "rule" => array(
3176 "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3177 ),
3178 "uri" => ""
3179 ),
3180 "look" => array(
3181 "icon" => "look",
3182 "title" => "Look",
3183 "rule" => array(
3184 "www\.look\.com" => "",
3185 "Lookbot" => ""
3186 ),
3187 "uri" => ""
3188 ),
3189 "looksmart" => array(
3190 "icon" => "looksmart",
3191 "title" => "LookSmart",
3192 "rule" => array(
3193 "^Martini" => "",
3194 "^MantraAgent" => "",
3195 "FurlBot" => "",
3196 "looksmart-sv-fw" => ""
3197 ),
3198 "uri" => ""
3199 ),
3200 "loop" => array(
3201 "icon" => "loop",
3202 "title" => "LOOP",
3203 "rule" => array(
3204 "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3205 ),
3206 "uri" => ""
3207 ),
3208 "lotkyll" => array(
3209 "icon" => "robot",
3210 "title" => "Lotkyll",
3211 "rule" => array(
3212 "Lotkyll" => ""
3213 ),
3214 "uri" => ""
3215 ),
3216 "lwp" => array(
3217 "icon" => "robot",
3218 "title" => "lwp",
3219 "rule" => array(
3220 "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3221 ),
3222 "uri" => ""
3223 ),
3224 "lycos" => array(
3225 "icon" => "lycos",
3226 "title" => "Lycos",
3227 "rule" => array(
3228 "Lycos_Spider_" => ""
3229 ),
3230 "uri" => ""
3231 ),
3232 "magpierss" => array(
3233 "icon" => "rss",
3234 "title" => "MagpieRSS",
3235 "rule" => array(
3236 "MagpieRSS" => ""
3237 ),
3238 "uri" => "http://magpierss.sourceforge.net/"
3239 ),
3240 "mailru" => array(
3241 "icon" => "mailru",
3242 "title" => "Mail.Ru",
3243 "rule" => array(
3244 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3245 "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3246 ),
3247 "uri" => "http://www.mail.ru/"
3248 ),
3249 "mailsweeper" => array(
3250 "icon" => "robot",
3251 "title" => "Mail Sweeper",
3252 "rule" => array(
3253 "Mail[ \-]?Sweeper" => ""
3254 ),
3255 "uri" => ""
3256 ),
3257 "marvin" => array(
3258 "icon" => "robot",
3259 "title" => "Marvin",
3260 "rule" => array(
3261 "^Marvin" => ""
3262 ),
3263 "uri" => ""
3264 ),
3265 "matkurja" => array(
3266 "icon" => "matkurja",
3267 "title" => "Mat'Kurja",
3268 "rule" => array(
3269 "Mosad[ /]([0-9.]{1,10})" => "\\1"
3270 ),
3271 "uri" => ""
3272 ),
3273 "mavicanet" => array(
3274 "icon" => "mavicanet",
3275 "title" => "Mavicanet",
3276 "rule" => array(
3277 "Mavicanet robot" => ""
3278 ),
3279 "uri" => ""
3280 ),
3281 "meanpath" => array(
3282 "icon" => "meanpath",
3283 "title" => "Meanpath",
3284 "rule" => array(
3285 "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3286 ),
3287 "uri" => "http://www.meanpath.com/meanpathbot.html"
3288 ),
3289 "mediater" => array(
3290 "icon" => "robot",
3291 "title" => "Mediater",
3292 "rule" => array (
3293 "^libwww[ /]([0-9.]{1,10})" => "\\1"
3294 ),
3295 "uri" => ""
3296 ),
3297 "memory" => array(
3298 "icon" => "memory",
3299 "title" => "internet Memory",
3300 "rule" => array (
3301 "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3302 ),
3303 "uri" => "http://internetmemory.org/en/"
3304 ),
3305 "mercator" => array(
3306 "icon" => "robot",
3307 "title" => "Mercator",
3308 "rule" => array(
3309 "Mercator" => ""
3310 ),
3311 "uri" => ""
3312 ),
3313 "metacarta" => array(
3314 "icon" => "robot",
3315 "title" => "Metacarta",
3316 "rule" => array(
3317 "^RRC \(crawler_admin@bigfoot.com\)" => "", // parentheses escaped so they match literally, as in the samualt9 rule below
3318 "^flunky" => "",
3319 "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3320 ),
3321 "uri" => "http://www.metacarta.com"
3322 ),
3323 "metager" => array(
3324 "icon" => "metager",
3325 "title" => "MetaGer",
3326 "rule" => array(
3327 "MetaGer" => ""
3328 ),
3329 "uri" => ""
3330 ),
3331 "metamark" => array(
3332 "icon" => "robot",
3333 "title" => "Metamark",
3334 "rule" => array(
3335 "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3336 ),
3337 "uri" => "http://metamark.net"
3338 ),
3339 "metamedic" => array(
3340 "icon" => "metamedic",
3341 "title" => "MetaMedic",
3342 "rule" => array(
3343 "MediBot[ /]([0-9.]{1,10})" => "\\1"
3344 ),
3345 "uri" => ""
3346 ),
3347 "mirago" => array(
3348 "icon" => "mirago",
3349 "title" => "Mirago",
3350 "rule" => array(
3351 "Mirago" => ""
3352 ),
3353 "uri" => ""
3354 ),
3355 "misterwong" => array(
3356 "icon" => "misterwong",
3357 "title" => "Mister Wong",
3358 "rule" => array(
3359 "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3360 ),
3361 "uri" => "http://www.mister-wong.de/"
3362 ),
3363 "miva" => array(
3364 "icon" => "miva",
3365 "title" => "Miva",
3366 "rule" => array(
3367 "AlgoFeedback@miva\.com" => ""
3368 ),
3369 "uri" => "http://www.miva.com/"
3370 ),
3371 "mj12" => array(
3372 "icon" => "mj12",
3373 "title" => "Majestic-12",
3374 "rule" => array(
3375 "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3376 "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3377 ),
3378 "uri" => "http://majestic12.co.uk/bot.php"
3379 ),
3380 "mlbot" => array(
3381 "icon" => "robot",
3382 "title" => "MLBot",
3383 "rule" => array(
3384 "^MLBot" => ""
3385 ),
3386 "uri" => "http://www.metadatalabs.com/mlbot"
3387 ),
3388 "mnogo" => array(
3389 "icon" => "mnogo",
3390 "title" => "mnoGoSearch",
3391 "rule" => array(
3392 "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3393 ),
3394 "uri" => "http://www.mnogosearch.org/"
3395 ),
3396 "mobileok" => array(
3397 "icon" => "mobileok",
3398 "title" => "W3C mobileOK",
3399 "rule" => array(
3400 "^W3C-mobileOK" => ""
3401 ),
3402 "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3403 ),
3404 "mojeek" => array(
3405 "icon" => "mojeek",
3406 "title" => "Mojeek",
3407 "rule" => array(
3408 "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3409 ),
3410 "uri" => "https://www.mojeek.com/bot.html"
3411 ),
3412 "momspider" => array(
3413 "icon" => "robot",
3414 "title" => "MOM Spider",
3415 "rule" => array(
3416 "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3417 ),
3418 "uri" => ""
3419 ),
3420 "moreover" => array(
3421 "icon" => "moreover",
3422 "title" => "Moreover",
3423 "rule" => array(
3424 "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3425 ),
3426 "uri" => ""
3427 ),
3428 "movabletype" => array(
3429 "icon" => "movabletype",
3430 "title" => "Movable Type",
3431 "rule" => array(
3432 "MovableType[ /]([0-9.]{1,10})" => "\\1"
3433 ),
3434 "uri" => ""
3435 ),
3436 "mozdex" => array(
3437 "icon" => "mozdex",
3438 "title" => "MozDex",
3439 "rule" => array(
3440 "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3441 ),
3442 "uri" => ""
3443 ),
3444 "mqbot" => array(
3445 "icon" => "robot",
3446 "title" => "MQbot",
3447 "rule" => array(
3448 "MQbot" => ""
3449 ),
3450 "uri" => ""
3451 ),
3452 "msnbot" => array(
3453 "icon" => "bing",
3454 "title" => "Bing",
3455 "rule" => array(
3456 "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3457 "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3458 "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3459 "bingbot[ /]([0-9.]{1,10})" => "\\1"
3460 ),
3461 "uri" => ""
3462 ),
3463 "msnbot-mobile" => array(
3464 "icon" => "msn",
3465 "title" => "MSN Mobile",
3466 "rule" => array(
3467 "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3468 "MSNBOT_Mobile" => "",
3469 "MSMOBOT" => ""
3470 ),
3471 "uri" => ""
3472 ),
3473 "mslivebot" => array(
3474 "icon" => "livesearch",
3475 "title" => "MS Live Search",
3476 "rule" => array(
3477 "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3478 ),
3479 "uri" => ""
3480 ),
3481 "msproxy" => array(
3482 "icon" => "robot",
3483 "title" => "MSProxy",
3484 "rule" => array(
3485 "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3486 ),
3487 "uri" => ""
3488 ),
3489 "msrbot" => array(
3490 "icon" => "robot",
3491 "title" => "MSRBOT",
3492 "rule" => array(
3493 "^MSRBOT" => ""
3494 ),
3495 "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3496 ),
3497 "mswebdav" => array(
3498 "icon" => "robot",
3499 "title" => "MS-WebDAV",
3500 "rule" => array(
3501 "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3502 ),
3503 "uri" => ""
3504 ),
3505 "mticon" => array(
3506 "icon" => "robot",
3507 "title" => "MTIcon",
3508 "rule" => array(
3509 "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3510 ),
3511 "uri" => ""
3512 ),
3513 "multipage-validator" => array(
3514 "icon" => "multipage-validator",
3515 "title" => "Multipage Validator",
3516 "rule" => array(
3517 "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3518 ),
3519 "uri" => "http://www.validator.ca/"
3520 ),
3521 "myrss" => array(
3522 "icon" => "rss",
3523 "title" => "MyRSS",
3524 "rule" => array(
3525 "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3526 ),
3527 "uri" => ""
3528 ),
3529 "multimap" => array(
3530 "icon" => "robot",
3531 "title" => "Multimap",
3532 "rule" => array(
3533 "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3534 ),
3535 "uri" => ""
3536 ),
3537 "najdi" => array(
3538 "icon" => "najdi",
3539 "title" => "Najdi.si",
3540 "rule" => array(
3541 "Najdi.si" => ""
3542 ),
3543 "uri" => "http://www.najdi.si"
3544 ),
3545 "nameprotect" => array(
3546 "icon" => "nameprotect",
3547 "title" => "Name Protect",
3548 "rule" => array(
3549 "NPBot" => ""
3550 ),
3551 "uri" => ""
3552 ),
3553 "nationaldirectory" => array(
3554 "icon" => "robot",
3555 "title" => "National Directory",
3556 "rule" => array(
3557 "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3558 ),
3559 "uri" => ""
3560 ),
3561 "natsumican" => array(
3562 "icon" => "robot",
3563 "title" => "Natsu Mican",
3564 "rule" => array(
3565 "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3566 ),
3567 "uri" => ""
3568 ),
3569 "naverbot" => array(
3570 "icon" => "naverbot",
3571 "title" => "Naver",
3572 "rule" => array(
3573 "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3574 "Naver(Bot)?" => "",
3575 "^nabot" => ""
3576 ),
3577 "uri" => ""
3578 ),
3579 "navisso" => array(
3580 "icon" => "navisso",
3581 "title" => "Navisso",
3582 "rule" => array(
3583 "Navisso(Bot)?" => ""
3584 ),
3585 "uri" => "http://www.navisso.com"
3586 ),
3587 "neofonie" => array(
3588 "icon" => "robot",
3589 "title" => "Neofonie",
3590 "rule" => array(
3591 "www.neofonie.de" => ""
3592 ),
3593 "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3594 ),
3595 "neomo" => array(
3596 "icon" => "robot",
3597 "title" => "Neomo",
3598 "rule" => array(
3599 "Francis[ /]([0-9.]{1,10})" => "\\1"
3600 ),
3601 "uri" => ""
3602 ),
3603 "nessus" => array(
3604 "icon" => "nessus",
3605 "title" => "Nessus",
3606 "rule" => array(
3607 "Nessus\)$" => ""
3608 ),
3609 "uri" => ""
3610 ),
3611 "nerdybot" => array(
3612 "icon" => "robot",
3613 "title" => "NerdyBot",
3614 "rule" => array(
3615 "NerdyBot" => ""
3616 ),
3617 "uri" => "http://nerdybot.com/"
3618 ),
3619 "nerdbynature" => array(
3620 "icon" => "nerdbynature",
3621 "title" => "NerdByNature",
3622 "rule" => array(
3623 "NerdByNature.Bot" => ""
3624 ),
3625 "uri" => "http://www.nerdbynature.net/bot"
3626 ),
3627 "netants" => array(
3628 "icon" => "netants",
3629 "title" => "NetAnts",
3630 "rule" => array(
3631 "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3632 ),
3633 "uri" => ""
3634 ),
3635 "netcraft" => array(
3636 "icon" => "netcraft",
3637 "title" => "Netcraft",
3638 "rule" => array(
3639 "netcraft" => ""
3640 ),
3641 "uri" => ""
3642 ),
3643 "netinfo" => array(
3644 "icon" => "netinfo",
3645 "title" => "Netinfo",
3646 "rule" => array(
3647 "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3648 ),
3649 "uri" => "http://netinfo.bg/"
3650 ),
3651 "netluchs" => array(
3652 "icon" => "netluchs",
3653 "title" => "Netluchs",
3654 "rule" => array(
3655 "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3656 ),
3657 "uri" => "http://www.netluchs.de/"
3658 ),
3659 "netmechanic" => array(
3660 "icon" => "netmechanic",
3661 "title" => "NetMechanic",
3662 "rule" => array(
3663 "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3664 ),
3665 "uri" => ""
3666 ),
3667 "netnose" => array(
3668 "icon" => "netnose",
3669 "title" => "NetNose",
3670 "rule" => array(
3671 "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3672 ),
3673 "uri" => ""
3674 ),
3675 "netoskop" => array(
3676 "icon" => "robot",
3677 "title" => "Netoskop",
3678 "rule" => array(
3679 "netoskop" => ""
3680 ),
3681 "uri" => ""
3682 ),
3683 "netpromoter" => array(
3684 "icon" => "netpromoter",
3685 "title" => "NetPromoter",
3686 "rule" => array(
3687 "NetPromoter Spider" => ""
3688 ),
3689 "uri" => "http://www.net-promoter.com/"
3690 ),
3691 "netprospector" => array(
3692 "icon" => "robot",
3693 "title" => "Netprospector",
3694 "rule" => array(
3695 "^netprospector" => ""
3696 ), "uri" => "" // adds the "uri" key this entry was missing; kept on this line to preserve the listing's numbering
3697 ),
3698 "netpumper" => array(
3699 "icon" => "robot",
3700 "title" => "Netpumper",
3701 "rule" => array(
3702 "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3703 ),
3704 "uri" => ""
3705 ),
3706 "netscapeproxy" => array(
3707 "icon" => "netscape",
3708 "title" => "Netscape Proxy",
3709 "rule" => array(
3710 "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3711 ),
3712 "uri" => ""
3713 ),
3714 "netspective" => array(
3715 "icon" => "robot",
3716 "title" => "NetSpective",
3717 "rule" => array(
3718 "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3719 ),
3720 "uri" => ""
3721 ),
3722 "netvibes" => array(
3723 "icon" => "netvibes",
3724 "title" => "Netvibes",
3725 "rule" => array(
3726 "^Netvibes" => "" // the pattern has no capture group, so there is no version to report
3727 ),
3728 "uri" => ""
3729 ),
3730 "newsfire" => array(
3731 "icon" => "newsfire",
3732 "title" => "NewsFire",
3733 "rule" => array(
3734 "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3735 ),
3736 "uri" => ""
3737 ),
3738 "newsgator" => array(
3739 "icon" => "newsgator",
3740 "title" => "NewsGator",
3741 "rule" => array(
3742 "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3743 ),
3744 "uri" => ""
3745 ),
3746 "newzcrawler" => array(
3747 "icon" => "newzcrawler",
3748 "title" => "NewzCrawler",
3749 "rule" => array(
3750 "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3751 ),
3752 "uri" => ""
3753 ),
3754 "nextopia" => array(
3755 "icon" => "robot", // generic icon; this entry previously reused the NewzCrawler icon and title
3756 "title" => "Nextopia",
3757 "rule" => array(
3758 "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
3759 ),
3760 "uri" => ""
3761 ),
3762 "ngsearch" => array(
3763 "icon" => "ngsearch",
3764 "title" => "NG Search",
3765 "rule" => array(
3766 "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3767 ),
3768 "uri" => ""
3769 ),
3770 "nimble" => array(
3771 "icon" => "robot",
3772 "title" => "Nimble",
3773 "rule" => array(
3774 "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3775 ),
3776 "uri" => ""
3777 ),
3778 "nmap" => array(
3779 "icon" => "nmap",
3780 "title" => "Nmap",
3781 "rule" => array(
3782 "Nmap Scripting Engine" => ""
3783 ),
3784 "uri" => "http://nmap.org/book/nse.html"
3785 ),
3786 "nusearch" => array(
3787 "icon" => "robot",
3788 "title" => "NuSearch",
3789 "rule" => array(
3790 "^nuSearch" => ""
3791 ),
3792 "uri" => "http://www.nusearch.com/"
3793 ),
3794 "noago" => array(
3795 "icon" => "noago",
3796 "title" => "Noago",
3797 "rule" => array(
3798 "Noago Spider" => ""
3799 ),
3800 "uri" => "http://www.noago.com/"
3801 ),
3802 "noviforum" => array(
3803 "icon" => "noviforum",
3804 "title" => "Noviforum",
3805 "rule" => array(
3806 "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3807 ),
3808 "uri" => ""
3809 ),
3810 "noxtrum" => array(
3811 "icon" => "noxtrum",
3812 "title" => "noXtrum",
3813 "rule" => array(
3814 "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3815 ),
3816 "uri" => ""
3817 ),
3818 "noyona" => array(
3819 "icon" => "robot",
3820 "title" => "Noyona",
3821 "rule" => array(
3822 "noyona.([0-9._]{1,10})" => "\\1"
3823 ),
3824 "uri" => "http://noyona.com/"
3825 ),
3826 "nsauditor" => array(
3827 "icon" => "nsauditor",
3828 "title" => "Nsauditor",
3829 "rule" => array(
3830 "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3831 ),
3832 "uri" => "http://www.nsauditor.com/"
3833 ),
3834 "obidosbot" => array(
3835 "icon" => "robot",
3836 "title" => "Bookwatch",
3837 "rule" => array(
3838 "obidos[ \-]?bot" => ""
3839 ),
3840 "uri" => ""
3841 ),
3842 "objectssearch" => array(
3843 "icon" => "robot",
3844 "title" => "Objects Search",
3845 "rule" => array(
3846 "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3847 ),
3848 "uri" => ""
3849 ),
3850 "obot" => array(
3851 "icon" => "ibm",
3852 "title" => "IBM (ONLY) Crawler",
3853 "rule" => array(
3854 "oBot[ /]([0-9.]{1,10})" => "\\1"
3855 ),
3856 "uri" => "http://filterdb.iss.net/crawler/"
3857 // Previously from "ONLY Solutions GmbH" – that is what the O stands for
3858 ),
3859 "ocawa" => array(
3860 "icon" => "ocawa",
3861 "title" => "Ocawa",
3862 "rule" => array(
3863 "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3864 "Ocawa" => ""
3865 ),
3866 "uri" => "http://www.ocawa.com/"
3867 ),
3868 "octora" => array(
3869 "icon" => "octora",
3870 "title" => "Octora",
3871 "rule" => array(
3872 "^Octora (Beta)?" => ""
3873 ),
3874 "uri" => "http://www.octora.com/"
3875 ),
3876 "offlineexplorer" => array(
3877 "icon" => "robot",
3878 "title" => "OfflineExplorer",
3879 "rule" => array(
3880 "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3881 ),
3882 "uri" => ""
3883 ),
3884 "omea" => array(
3885 "icon" => "omea",
3886 "title" => "Omea Reader",
3887 "rule" => array(
3888 "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3889 ),
3890 "uri" => ""
3891 ),
3892 "onet" => array(
3893 "icon" => "onet",
3894 "title" => "Onet",
3895 "rule" => array(
3896 "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3897 "Onet\.pl" => "",
3898 "inktomi.search.onet" => ""
3899 ),
3900 "uri" => "http://www.onet.pl"
3901 ),
3902 "online24" => array(
3903 "icon" => "robot",
3904 "title" => "Online24",
3905 "rule" => array(
3906 "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3907 ),
3908 "uri" => "http://www.online24.de"
3909 ),
3910 "onlinewebcheck" => array(
3911 "icon" => "csehtmlvalidator",
3912 "title" => "CSE HTML Validator",
3913 "rule" => array(
3914 "onlinewebcheck" => ""
3915 ),
3916 "uri" => "http://www.onlinewebcheck.com"
3917 ),
3918 "onsearch" => array(
3919 "icon" => "onsearch",
3920 "title" => "OnSearch",
3921 "rule" => array(
3922 "^onCHECK-Robot" => ""
3923 ),
3924 "uri" => "http://www.onsearch.de"
3925 ),
3926 "onto" => array(
3927 "icon" => "robot",
3928 "title" => "OntoSpider",
3929 "rule" => array(
3930 "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
3931 ),
3932 "uri" => "http://ontospider.i-n.info/"
3933 ),
3934 "openacoon" => array(
3935 "icon" => "robot",
3936 "title" => "OpenAcoon",
3937 "rule" => array(
3938 "^OpenAcoon v([0-9.]{1,10})" => "\\1"
3939 ),
3940 "uri" => "http://www.openacoon.de/"
3941 ),
3942 "openfind" => array(
3943 "icon" => "openfind",
3944 "title" => "Openfind",
3945 "rule" => array(
3946 "openbot[ /]([0-9.]{1,10})" => "\\1",
3947 "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
3948 ),
3949 "uri" => ""
3950 ),
3951 "opentagger" => array(
3952 "icon" => "robot",
3953 "title" => "OpenTagger",
3954 "rule" => array(
3955 "^OpenTaggerBot" => ""
3956 ),
3957 "uri" => "http://www.opentagger.com/opentaggerbot.htm"
3958 ),
3959 "opentext" => array(
3960 "icon" => "opentext",
3961 "title" => "OpenText",
3962 "rule" => array(
3963 "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
3964 ),
3965 "uri" => "http://www.opentext.net/"
3966 ),
3967 "openweb" => array(
3968 "icon" => "robot",
3969 "title" => "OpenWebSpider",
3970 "rule" => array(
3971 "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
3972 "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
3973 ),
3974 "uri" => "http://www.openwebspider.org"
3975 ),
3976 "openx" => array(
3977 "icon" => "openx",
3978 "title" => "OpenX Spider",
3979 "rule" => array(
3980 "OpenX" => ""
3981 ),
3982 "uri" => "http://www.openx.org"
3983 ),
3984 "orange" => array(
3985 "icon" => "orange",
3986 "title" => "Orange",
3987 "rule" => array(
3988 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1"
3989 ),
3990 "uri" => "http://orange.com/"
3991 ),
3992 "organica" => array(
3993 "icon" => "robot",
3994 "title" => "Organica",
3995 "rule" => array(
3996 "crawler@organica\.us" => ""
3997 ),
3998 "uri" => ""
3999 ),
4000 "outfox" => array(
4001 "icon" => "robot",
4002 "title" => "Outfox Melon",
4003 "rule" => array(
4004 "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4005 "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4006 ),
4007 "uri" => ""
4008 ),
4009 "overture" => array(
4010 "icon" => "overture",
4011 "title" => "Overture",
4012 "rule" => array(
4013 "Overture[ \-]?WebCrawler" => ""
4014 ),
4015 "uri" => ""
4016 ),
4017 "page2rss" => array(
4018 "icon" => "page2rss",
4019 "title" => "Page2RSS",
4020 "rule" => array(
4021 "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4022 ),
4023 "uri" => "http://page2rss.com"
4024 ),
4025 "pagebytes" => array(
4026 "icon" => "robot",
4027 "title" => "PageBites",
4028 "rule" => array(
4029 "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4030 ),
4031 "uri" => ""
4032 ),
4033 "pagesinventory" => array(
4034 "icon" => "pagesinventory",
4035 "title" => "PagesInventory",
4036 "rule" => array(
4037 "^PagesInventory" => ""
4038 ),
4039 "uri" => "http://www.pagesinventory.com"
4040 ),
4041 "pagesjaunes" => array(
4042 "icon" => "pagesjaunes",
4043 "title" => "Pages Jaunes",
4044 "rule" => array(
4045 "PJBot[ /]([0-9.]{1,10})" => "\\1"
4046 ),
4047 "uri" => "http://www.pagesjaunes.fr/"
4048 ),
4049 "pagevalet" => array(
4050 "icon" => "wdg",
4051 "title" => "WDG Page Valet",
4052 "rule" => array(
4053 "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4054 ),
4055 "uri" => "http://www.htmlhelp.com/tools/validator/"
4056 ),
4057 "panopeabot" => array(
4058 "icon" => "robot",
4059 "title" => "PanopeaBot",
4060 "rule" => array(
4061 "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4062 ),
4063 "uri" => ""
4064 ),
4065 "parchmenthill" => array(
4066 "icon" => "robot",
4067 "title" => "Parchment Hill",
4068 "rule" => array(
4069 "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4070 ),
4071 "uri" => "http://www.parchmenthill.com/search.htm"
4072 ),
4073 "pascient" => array(
4074 "icon" => "pascient",
4075 "title" => "Panscient", // display name spelled like the crawler's own domain below; key and icon name kept unchanged because other code or files may reference them
4076 "rule" => array(
4077 "panscient.com" => ""
4078 ),
4079 "uri" => "http://www.panscient.com/"
4080 ),
4081 "peerbot" => array(
4082 "icon" => "peerbot",
4083 "title" => "Peerbot",
4084 "rule" => array(
4085 "^PEERbot" => ""
4086 ),
4087 "uri" => ""
4088 ),
4089 "php" => array(
4090 "icon" => "php",
4091 "title" => "PHP",
4092 "rule" => array(
4093 "^PHP[ /]([0-9.]{1,10})" => "\\1"
4094 ),
4095 "uri" => ""
4096 ),
4097 "phpcrawl" => array(
4098 "icon" => "robot",
4099 "title" => "PHPCrawl",
4100 "rule" => array(
4101 "^PHPCrawl" => ""
4102 ),
4103 "uri" => "http://phpcrawl.cuab.de/"
4104 ),
4105 "phpdig" => array(
4106 "icon" => "robot",
4107 "title" => "PhpDig",
4108 "rule" => array(
4109 "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4110 ),
4111 "uri" => "http://www.finbot.com/"
4112 ),
4113 "phpversiontracker" => array(
4114 "icon" => "phpversiontracker",
4115 "title" => "PHP version tracker",
4116 "rule" => array(
4117 "^PHP version tracker" => ""
4118 ),
4119 "uri" => "http://www.nexen.net/phpversion/bot.php"
4120 ),
4121 "pictureofinternet" => array(
4122 "icon" => "robot",
4123 "title" => "PictureOfInternet",
4124 "rule" => array(
4125 "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // report the captured version (group 1) instead of discarding it, like the other versioned rules
4126 ),
4127 "uri" => ""
4128 ),
4129 "pingdom" => array(
4130 "icon" => "pingdom",
4131 "title" => "Pingdom",
4132 "rule" => array(
4133 "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4134 "^Pingdom" => ""
4135 ),
4136 "uri" => "http://www.pingdom.com/"
4137 ),
4138 "pinseri" => array(
4139 "icon" => "pinseri",
4140 "title" => "Pinseri",
4141 "rule" => array(
4142 "www\.pinseri\.com/bloglist" => ""
4143 ),
4144 "uri" => ""
4145 ),
4146 "plagger" => array(
4147 "icon" => "plagger",
4148 "title" => "Plagger",
4149 "rule" => array(
4150 "Plagger[ /]([0-9.]{1,10})" => "\\1"
4151 ),
4152 "uri" => "http://plagger.org/" // was "plugger.org", a misspelling of the project name - NOTE(review): confirm the homepage is still reachable
4153 ),
4154 "planet" => array(
4155 "icon" => "planet",
4156 "title" => "Planet",
4157 "rule" => array(
4158 "Planet[ /]([0-9.]{1,10})" => "\\1"
4159 ),
4160 "uri" => ""
4161 ),
4162 "plantynet" => array(
4163 "icon" => "robot",
4164 "title" => "PlantyNet",
4165 "rule" => array(
4166 "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4167 ),
4168 "uri" => ""
4169 ),
4170 "pluck" => array(
4171 "icon" => "pluck",
4172 "title" => "Pluck",
4173 "rule" => array(
4174 "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4175 ),
4176 "uri" => ""
4177 ),
4178 "plsearch" => array(
4179 "icon" => "plsearch",
4180 "title" => "PlanetSearch",
4181 "rule" => array(
4182 "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4183 ),
4184 "uri" => ""
4185 ),
4186 "poe" => array(
4187 "icon" => "robot",
4188 "title" => "POE-Component",
4189 "rule" => array(
4190 "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4191 ),
4192 "uri" => ""
4193 ),
4194 "pogodak" => array(
4195 "icon" => "pogodak",
4196 "title" => "Pogodak",
4197 "rule" => array(
4198 "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4199 ),
4200 "uri" => ""
4201 ),
4202 "poodle" => array(
4203 "icon" => "robot",
4204 "title" => "Poodle predictor",
4205 "rule" => array(
4206 "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is the (oo|ooo) spelling alternation; the version number is group 2
4207 "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no version follows the name
4208 ),
4209 "uri" => "http://www.gritechnologies.com/tools/spider.go"
4210 ),
4211 "pompos" => array(
4212 "icon" => "pompos",
4213 "title" => "Pompos",
4214 "rule" => array(
4215 "Pompos[ /]([0-9.]{1,10})" => "\\1"
4216 ),
4217 "uri" => ""
4218 ),
4219 "popdex" => array(
4220 "icon" => "robot",
4221 "title" => "Popdexter",
4222 "rule" => array(
4223 "Popdexter" => ""
4224 ),
4225 "uri" => ""
4226 ),
4227 "postrank" => array(
4228 "icon" => "postrank",
4229 "title" => "PostRank",
4230 "rule" => array(
4231 "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4232 ),
4233 "uri" => "http://www.postrank.com/"
4234 ),
4235 "powermarks" => array(
4236 "icon" => "robot",
4237 "title" => "Powermarks",
4238 "rule" => array(
4239 "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4240 ),
4241 "uri" => ""
4242 ),
4243 "probe" => array(
4244 "icon" => "robot",
4245 "title" => "PROBE!",
4246 "rule" => array(
4247 "^PROBE!" => ""
4248 ),
4249 "uri" => ""
4250 ),
4251 "projecthoneypot" => array(
4252 "icon" => "projecthoneypot",
4253 "title" => "Project Honeypot",
4254 "rule" => array(
4255 "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4256 "projecthoneypot" => ""
4257 ),
4258 "uri" => "http://www.projecthoneypot.org"
4259 ),
4260 "proxycache" => array(
4261 "icon" => "robot",
4262 "title" => "Proxy Cache",
4263 "rule" => array(
4264 "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4265 ),
4266 "uri" => ""
4267 ),
4268 "proxyhunter" => array(
4269 "icon" => "robot",
4270 "title" => "ProxyHunter",
4271 "rule" => array(
4272 "ProxyHunter" => ""
4273 ),
4274 "uri" => ""
4275 ),
4276 "psbot" => array(
4277 "icon" => "picsearch",
4278 "title" => "PicSearch",
4279 "rule" => array(
4280 "^psbot" => ""
4281 ),
4282 "uri" => ""
4283 ),
4284 "pubsub" => array(
4285 "icon" => "pubsub",
4286 "title" => "PubSub",
4287 "rule" => array(
4288 "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4289 "^PubSub\.com" => ""
4290 ),
4291 "uri" => ""
4292 ),
4293 "pubarch" => array(
4294 "icon" => "robot",
4295 "title" => "PubArchive",
4296 "rule" => array(
4297 "publiclibraryarchive.org" => ""
4298 ),
4299 "uri" => ""
4300 ),
4301 "pukiwiki" => array(
4302 "icon" => "pukiwiki",
4303 "title" => "PukiWiki",
4304 "rule" => array(
4305 "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4306 ),
4307 "uri" => ""
4308 ),
4309 "pwebotxy" => array(
4310 "icon" => "pwebotxy",
4311 "title" => "PWeBot/X.Y",
4312 "rule" => array(
4313 "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4314 ),
4315 "uri" => "http://www.programacionweb.net/robot.php"
4316 ),
4317 "pxys" => array(
4318 "icon" => "robot",
4319 "title" => "PXYS",
4320 "rule" => array(
4321 "^pxys" => ""
4322 ),
4323 "uri" => ""
4324 ),
4325 "qango" => array(
4326 "icon" => "qango",
4327 "title" => "Qango",
4328 "rule" => array(
4329 "^Qango.com" => ""
4330 ),
4331 "uri" => "http://www.qango.com/" // was "quango.com"; the domain in the rule above is Qango.com
4332 ),
4333 "qihoo" => array(
4334 "icon" => "qihoo",
4335 "title" => "Qihoo",
4336 "rule" => array(
4337 "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4338 ),
4339 "uri" => "http://www.qihoo.com/"
4340 ),
4341 "qseero" => array(
4342 "icon" => "robot",
4343 "title" => "Qseero",
4344 "rule" => array(
4345 "Qseero v([0-9.]{1,10})" => "\\1"
4346 ),
4347 "uri" => "http://www.q0.com/"
4348 ),
4349 "quantcast" => array(
4350 "icon" => "robot",
4351 "title" => "Quantcast",
4352 "rule" => array(
4353 "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4354 ),
4355 "uri" => "http://www.quantcast.com/"
4356 ),
4357 "quepasa" => array(
4358 "icon" => "quepasa",
4359 "title" => "Quepasa",
4360 "rule" => array(
4361 "Quepasa[ \-]?Creep" => ""
4362 ),
4363 "uri" => ""
4364 ),
4365 "questfinder" => array(
4366 "icon" => "robot",
4367 "title" => "QuestFinder",
4368 "rule" => array(
4369 "www\.questfinder\.com" => ""
4370 ),
4371 "uri" => ""
4372 ),
4373 "qweery" => array(
4374 "icon" => "robot",
4375 "title" => "Qweery",
4376 "rule" => array(
4377 "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4378 ),
4379 "uri" => "http://qweerybot.qweery.nl"
4380 ),
4381 "racaicrawler" => array(
4382 "icon" => "robot",
4383 "title" => "RacaiCrawler",
4384 "rule" => array(
4385 "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
4386 ), "uri" => "" // added: every other entry defines "uri"; an empty string is what entries without a homepage use
4387 ),
4388 "radian6" => array(
4389 "icon" => "robot",
4390 "title" => "Radian6",
4391 "rule" => array(
4392 "www\.radian6\.com" => ""
4393 ),
4394 "uri" => "http://www.radian6.com"
4395 ),
4396 "rambler" => array(
4397 "icon" => "rambler",
4398 "title" => "Rambler",
4399 "rule" => array(
4400 "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4401 ),
4402 "uri" => ""
4403 ),
4404 "ramiba" => array(
4405 "icon" => "robot",
4406 "title" => "Ramiba",
4407 "rule" => array(
4408 "^ramiba(-bot)?" => "" // the only group is the optional "-bot" suffix, not a version, so no note is reported
4409 ),
4410 "uri" => ""
4411 ),
4412 "rankur" => array(
4413 "icon" => "rankur",
4414 "title" => "Rankur",
4415 "rule" => array(
4416 "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4417 ),
4418 "uri" => "http://rankur.com/",
4419 ),
4420 "red" => array(
4421 "icon" => "red",
4422 "title" => "RED",
4423 "rule" => array(
4424 "RED[ /]([0-9.]{1,10})" => "\\1"
4425 ),
4426 "uri" => "http://redbot.org/"
4427 ),
4428 "rediff" => array(
4429 "icon" => "rediff",
4430 "title" => "Rediff",
4431 "rule" => array(
4432 "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4433 ),
4434 "uri" => "http://www.rediff.com",
4435 ),
4436 "repia" => array(
4437 "icon" => "robot",
4438 "title" => "Repia",
4439 "rule" => array(
4440 "webmaster@repia\.com" => ""
4441 ),
4442 "uri" => ""
4443 ),
4444 "robotgenius" => array(
4445 "icon" => "robot",
4446 "title" => "Robot Genius",
4447 "rule" => array(
4448 "^robotgenius" => ""
4449 ),
4450 "uri" => "http://robotgenius.net",
4451 ),
4452 "robozilla" => array(
4453 "icon" => "robot",
4454 "title" => "Robozilla",
4455 "rule" => array(
4456 "Robozilla" => ""
4457 ),
4458 "uri" => ""
4459 ),
4460 "rogerbot" => array(
4461 "icon" => "moz",
4462 "title" => "Moz Rogerbot",
4463 "rule" => array(
4464 "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4465 ),
4466 "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4467 ),
4468 "rojo" => array(
4469 "icon" => "rojo",
4470 "title" => "Rojo",
4471 "rule" => array(
4472 "Rojo[ /]([0-9.]{1,10})" => "\\1"
4473 ),
4474 "uri" => ""
4475 ),
4476 "rss-atom" => array(
4477 "icon" => "rss",
4478 "title" => "RSS / Atom",
4479 "rule" => array(
4480 "^Apple-PubSub" => "",
4481 "^AppleSyndication" => ""
4482 ),
4483 "uri" => ""
4484 ),
4485 "rssbot" => array(
4486 "icon" => "rss",
4487 "title" => "RSS-bot",
4488 "rule" => array(
4489 "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4490 ),
4491 "uri" => ""
4492 ),
4493 "rssbandit" => array(
4494 "icon" => "rssbandit",
4495 "title" => "RssBandit",
4496 "rule" => array(
4497 "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4498 ),
4499 "uri" => ""
4500 ),
4501 "rssimages" => array(
4502 "icon" => "rss",
4503 "title" => "RssImages",
4504 "rule" => array(
4505 "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4506 ),
4507 "uri" => ""
4508 ),
4509 "rssmicro" => array(
4510 "icon" => "rssmicro",
4511 "title" => "RSSMicro",
4512 "rule" => array(
4513 "RSSMicro\.com" => ""
4514 ),
4515 "uri" => "http://www.rssmicro.com"
4516 ),
4517 "rssowl" => array(
4518 "icon" => "rssowl",
4519 "title" => "RSSOwl",
4520 "rule" => array(
4521 "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4522 ),
4523 "uri" => ""
4524 ),
4525 "rssreader" => array(
4526 "icon" => "rss",
4527 "title" => "RssReader",
4528 "rule" => array(
4529 "RssReader[ /]([0-9.]{1,10})" => "\\1" // report the captured version (group 1) instead of discarding it, like the other versioned rules
4530 ),
4531 "uri" => ""
4532 ),
4533 "rtgi" => array(
4534 "icon" => "rtgi",
4535 "title" => "Rtgi",
4536 "rule" => array(
4537 "RTGI" => ""
4538 ),
4539 "uri" => "http://rtgi.fr/"
4540 ),
4541 "rufusbot" => array(
4542 "icon" => "robot",
4543 "title" => "RufusBot",
4544 "rule" => array(
4545 "RufusBot" => ""
4546 ),
4547 "uri" => ""
4548 ),
4549 "runet" => array(
4550 "icon" => "runet",
4551 "title" => "iTrack RuNet Crawler",
4552 "rule" => array(
4553 "Runet-Research-Crawler" => ""
4554 ),
4555 "uri" => "http://www.itrack.ru/research/cmsrate/"
4556 ),
4557 "runnk" => array(
4558 "icon" => "robot",
4559 "title" => "Runnk",
4560 "rule" => array(
4561 "Runnk RSS finder" => ""
4562 ),
4563 "uri" => "http://www.runnk.com/il/law"
4564 ),
4565 "sagool" => array(
4566 "icon" => "robot",
4567 "title" => "Sagool",
4568 "rule" => array(
4569 "MaSagool" => ""
4570 ),
4571 "uri" => "http://sagool.jp/"
4572 ),
4573 "sanszbot" => array(
4574 "icon" => "robot",
4575 "title" => "Sansz",
4576 "rule" => array(
4577 "SanszBot" => ""
4578 ),
4579 "uri" => ""
4580 ),
4581 "saucereader" => array(
4582 "icon" => "saucereader",
4583 "title" => "Sauce Reader",
4584 "rule" => array(
4585 "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4586 ),
4587 "uri" => ""
4588 ),
4589 "sbider" => array(
4590 "icon" => "sbider",
4591 "title" => "SBIder",
4592 "rule" => array(
4593 "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4594 "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4595 ),
4596 "uri" => ""
4597 ),
4598 "scirus" => array(
4599 "icon" => "robot",
4600 "title" => "Scirus",
4601 "rule" => array(
4602 "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4603 ),
4604 "uri" => ""
4605 ),
4606 "scoutjet" => array(
4607 "icon" => "scoutjet",
4608 "title" => "ScoutJet",
4609 "rule" => array(
4610 "ScoutJet" => ""
4611 ),
4612 "uri" => "http://www.scoutjet.com/"
4613 ),
4614 "scrapy" => array(
4615 "icon" => "scrapy",
4616 "title" => "Scrapy",
4617 "rule" => array(
4618 "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4619 ),
4620 "uri" => "http://scrapy.org"
4621 ),
4622 "scrubby" => array(
4623 "icon" => "scrubby",
4624 "title" => "Scrubby",
4625 "rule" => array(
4626 "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4627 ),
4628 "uri" => ""
4629 ),
4630 "sdm" => array(
4631 "icon" => "sdm",
4632 "title" => "SUN Download Manager",
4633 "rule" => array(
4634 "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4635 ),
4636 "uri" => ""
4637 ),
4638 "sealinks" => array(
4639 "icon" => "robot",
4640 "title" => "Sea Links",
4641 "rule" => array(
4642 "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4643 ),
4644 "uri" => ""
4645 ),
4646 "search17" => array(
4647 "icon" => "robot",
4648 "title" => "Search 17",
4649 "rule" => array(
4650 "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4651 ),
4652 "uri" => "http://www.search17.com/bot.php"
4653 ),
4654 "search2" => array(
4655 "icon" => "search2",
4656 "title" => "Search2.net",
4657 "rule" => array(
4658 "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4659 ),
4660 "uri" => "http://search2.net/"
4661 ),
4662 "searchbot" => array(
4663 "icon" => "robot",
4664 "title" => "Searchbot",
4665 "rule" => array(
4666 "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4667 ),
4668 "uri" => ""
4669 ),
4670 "searchch" => array(
4671 "icon" => "robot",
4672 "title" => "Search.ch",
4673 "rule" => array(
4674 "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4675 ),
4676 "uri" => ""
4677 ),
4678 "searchengineworld" => array(
4679 "icon" => "robot",
4680 "title" => "SearchEngineWorld",
4681 "rule" => array(
4682 "searchengineworld" => ""
4683 ),
4684 "uri" => "http://www.searchengineworld.com/"
4685 ),
4686 "searchhippo" => array(
4687 "icon" => "searchhippo",
4688 "title" => "Searchhippo",
4689 "rule" => array(
4690 "searchhippo" => ""
4691 ),
4692 "uri" => "http://www.searchhippo.com/"
4693 ),
4694 "searchthruus" => array(
4695 "icon" => "robot",
4696 "title" => "SearchThruUs",
4697 "rule" => array(
4698 "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4699 ),
4700 "uri" => ""
4701 ),
4702 "securecomputing" => array(
4703 "icon" => "robot",
4704 "title" => "Secure Computing",
4705 "rule" => array(
4706 "securecomputing" => ""
4707 ),
4708 "uri" => ""
4709 ),
4710 "seekport" => array(
4711 "icon" => "seekport",
4712 "title" => "Seekport",
4713 "rule" => array(
4714 "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4715 ),
4716 "uri" => ""
4717 ),
4718 "semanticdiscovery" => array(
4719 "icon" => "robot",
4720 "title" => "Semantic Discovery",
4721 "rule" => array(
4722 "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4723 ),
4724 "uri" => ""
4725 ),
4726 "semrush" => array(
4727 "icon" => "semrush",
4728 "title" => "SEMrush",
4729 "rule" => array(
4730 "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4731 ),
4732 "uri" => "http://www.semrush.com/bot.html"
4733 ),
4734 "sengine" => array(
4735 "icon" => "sengine",
4736 "title" => "Sengine",
4737 "rule" => array(
4738 "netEstate NE Crawler" => ""
4739 ),
4740 "uri" => "http://www.sengine.info/"
4741 ),
4742 "sensis" => array(
4743 "icon" => "sensis",
4744 "title" => "Sensis",
4745 "rule" => array(
4746 "^Sensis(.com.au)? Web Crawler" => ""
4747 ),
4748 "uri" => "http://sensis.com.au"
4749 ),
4750 "seokicks" => array(
4751 "icon" => "seokicks",
4752 "title" => "SEOkicks",
4753 "rule" => array(
4754 "SEOkicks-Robot" => ""
4755 ),
4756 "uri" => "http://www.seokicks.de/"
4757 ),
4758 "seoprofiler" => array(
4759 "icon" => "seoprofiler",
4760 "title" => "SEOprofiler",
4761 "rule" => array(
4762 "spbot[ /]([0-9.]{1,10})" => "\\1"
4763 ),
4764 "uri" => "http://www.seoprofiler.com/"
4765 ),
4766 "setooz" => array(
4767 "icon" => "setooz",
4768 "title" => "Setooz",
4769 "rule" => array(
4770 "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4771 ),
4772 "uri" => "http://www.setooz.com/oozbot.html"
4773 ),
4774 "seznam" => array(
4775 "icon" => "seznam",
4776 "title" => "Seznam",
4777 "rule" => array(
4778 "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4779 "Seznam" => ""
4780 ),
4781 "uri" => "http://www.seznam.cz"
4782 ),
4783 "sharpreader" => array(
4784 "icon" => "sharpreader",
4785 "title" => "SharpReader",
4786 "rule" => array(
4787 "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4788 ),
4789 "uri" => ""
4790 ),
4791 "shelob" => array(
4792 "icon" => "shelob",
4793 "title" => "Shelob", // was "Sherlock Spider", the title of the following entry; key, icon and rule here all name Shelob
4794 "rule" => array(
4795 "^Shelob" => ""
4796 ),
4797 "uri" => "http://www.gmx.net"
4798 ),
4799 "sherlockspider" => array(
4800 "icon" => "robot",
4801 "title" => "Sherlock Spider",
4802 "rule" => array(
4803 "sherlock_spider" => ""
4804 ),
4805 "uri" => ""
4806 ),
4807 "shim" => array(
4808 "icon" => "robot",
4809 "title" => "Shim Crawler",
4810 "rule" => array(
4811 "shim[ \-]crawler" => ""
4812 ),
4813 "uri" => ""
4814 ),
4815 "shopwiki" => array(
4816 "icon" => "shopwiki",
4817 "title" => "ShopWiki",
4818 "rule" => array(
4819 "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4820 ),
4821 "uri" => ""
4822 ),
4823 "shoula" => array(
4824 "icon" => "robot",
4825 "title" => "Shoula",
4826 "rule" => array(
4827 "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4828 ),
4829 "uri" => "http://www.shoula.com"
4830 ),
4831 "siege" => array(
4832 "icon" => "robot",
4833 "title" => "Siege",
4834 "rule" => array(
4835 "Siege[ /]([0-9.]{1,10})" => "\\1"
4836 ),
4837 "uri" => ""
4838 ),
4839 "siets" => array(
4840 "icon" => "robot",
4841 "title" => "Siets",
4842 "rule" => array(
4843 "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4844 ),
4845 "uri" => ""
4846 ),
4847 "simpy" => array(
4848 "icon" => "simpy",
4849 "title" => "Simpy",
4850 "rule" => array(
4851 "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4852 ),
4853 "uri" => ""
4854 ),
4855 "singingfish" => array(
4856 "icon" => "singingfish",
4857 "title" => "SingingFish",
4858 "rule" => array(
4859 "asterias[ /]([0-9.]{1,10})" => "\\1",
4860 "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4861 "asterias" => ""
4862 ),
4863 "uri" => ""
4864 ),
4865 "sirketce" => array(
4866 "icon" => "robot",
4867 "title" => "Sirketce",
4868 "rule" => array(
4869 "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4870 ),
4871 "uri" => "http://www.sirketce.com/bot.html"
4872 ),
4873 "sirobot" => array(
4874 "icon" => "robot",
4875 "title" => "SiroBot",
4876 "rule" => array(
4877 "sirobot" => ""
4878 ),
4879 "uri" => ""
4880 ),
4881 "sistrix" => array(
4882 "icon" => "sistrix",
4883 "title" => "SISTRIX",
4884 "rule" => array(
4885 "SISTRIX Crawler" => ""
4886 ),
4887 "uri" => "http://crawler.sistrix.net/"
4888 ),
4889 "sitebar" => array(
4890 "icon" => "sitebar",
4891 "title" => "SiteBar",
4892 "rule" => array(
4893 "SiteBar[ /]([0-9.]{1,10})" => "\\1"
4894 ),
4895 "uri" => ""
4896 ),
4897 "sitebot" => array(
4898 "icon" => "sitebot",
4899 "title" => "SiteBot",
4900 "rule" => array(
4901 "SiteBot[ /]([0-9.]{1,10})" => "\\1"
4902 ),
4903 "uri" => "http://www.sitebot.org/robot/"
4904 ),
4905 "siteexplorer" => array(
4906 "icon" => "siteexplorer",
4907 "title" => "SiteExplorer",
4908 "rule" => array(
4909 "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
4910 ),
4911 "uri" => "http://siteexplorer.info/"
4912 ),
4913 "sitesell" => array(
4914 "icon" => "sitesell",
4915 "title" => "SiteSell",
4916 "rule" => array(
4917 "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
4918 ),
4919 "uri" => ""
4920 ),
4921 "sitespider" => array(
4922 "icon" => "robot",
4923 "title" => "SiteSpider",
4924 "rule" => array(
4925 "^SiteSpider" => ""
4926 ),
4927 "uri" => ""
4928 ),
4929 "sitesucker" => array(
4930 "icon" => "sitesucker",
4931 "title" => "SiteSucker",
4932 "rule" => array(
4933 "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
4934 ),
4935 "uri" => "http://www.sitesucker.us/"
4936 ),
4937 "sitidi" => array(
4938 "icon" => "robot",
4939 "title" => "SitiDi",
4940 "rule" => array(
4941 "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
4942 ),
4943 "uri" => ""
4944 ),
4945 "sixy" => array(
4946 "icon" => "robot",
4947 "title" => "Sixy.ch",
4948 "rule" => array(
4949 "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
4950 ),
4951 "uri" => "http://sixy.ch"
4952 ),
4953 "skaffe" => array(
4954 "icon" => "robot",
4955 "title" => "Skaffe",
4956 "rule" => array(
4957 "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
4958 ),
4959 "uri" => "http://www.skaffe.com"
4960 ),
4961 "skizzle" => array(
4962 "icon" => "skizzle",
4963 "title" => "Skizzle",
4964 "rule" => array(
4965 "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
4966 ),
4967 "uri" => "http://www.skizzle.com"
4968 ),
4969 "slider" => array(
4970 "icon" => "robot",
4971 "title" => "Slider",
4972 "rule" => array(
4973 "^Slider[ /]([0-9.]{1,10})" => "\\1"
4974 ),
4975 "uri" => ""
4976 ),
4977 "slugch" => array(
4978 "icon" => "robot",
4979 "title" => "Slugch",
4980 "rule" => array(
4981 "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
4982 ),
4983 "uri" => ""
4984 ),
4985 "smartware" => array(
4986 "icon" => "robot",
4987 "title" => "SmartWareSoft",
4988 "rule" => array(
4989 "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
4990 ),
4991 "uri" => "http://www.smartwaresoft.com/swsbot12.html"
4992 ),
4993 "snookit" => array(
4994 "icon" => "snookit",
4995 "title" => "Snookit",
4996 "rule" => array(
4997 "^snookit" => ""
4998 ),
4999 "uri" => "http://www.snookit.com/"
5000 ),
5001 "snoopy" => array(
5002 "icon" => "robot",
5003 "title" => "Snoopy",
5004 "rule" => array(
5005 "^Snoopy.+?([0-9.]{1,10})" => "\\1", // lazy .+? so the group gets the whole version; greedy .+ left it only the last character (assumes PCRE matching - confirm in the code that applies these rules)
5006 "sna-([0-9.]{1,10})" => "\\1"
5007 ),
5008 "uri" => "http://snoopy.sourceforge.net/"
5009 ),
5010 "snyke" => array(
5011 "icon" => "robot",
5012 "title" => "Snyke",
5013 "rule" => array(
5014 "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5015 ),
5016 "uri" => "http://www.snyke.com"
5017 ),
5018 "socialradar" => array(
5019 "icon" => "socialradar",
5020 "title" => "Social Radar",
5021 "rule" => array(
5022 "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5023 ),
5024 "uri" => "http://infegy.com/"
5025 ),
5026 "soegning" => array(
5027 "icon" => "soegning",
5028 "title" => "Søgning",
5029 "rule" => array(
5030 "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5031 ),
5032 "uri" => ""
5033 ),
5034 "soft411" => array(
5035 "icon" => "soft411",
5036 "title" => "Soft411",
5037 "rule" => array(
5038 "SOFT411 Directory" => ""
5039 ),
5040 "uri" => ""
5041 ),
5042 "sogou" => array(
5043 "icon" => "sogou",
5044 "title" => "Sogou",
5045 "rule" => array(
5046 "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5047 ),
5048 "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5049 ),
5050 "sohu" => array(
5051 "icon" => "robot",
5052 "title" => "Sohu",
5053 "rule" => array(
5054 "sohu[ \-](agent|search)" => ""
5055 ),
5056 "uri" => ""
5057 ),
5058 "somewhere" => array(
5059 "icon" => "robot",
5060 "title" => "Somewhere.com",
5061 "rule" => array(
5062 "Mozilla\@somewhere\.com" => "" // pattern has no capture group, so there is nothing for a "\\1" note to refer to
5063 ),
5064 "uri" => "http://www.somewhere.com/"
5065 ),
5066 "sopheus" => array(
5067 "icon" => "robot",
5068 "title" => "Sopheus",
5069 "rule" => array(
5070 "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5071 ),
5072 "uri" => "http://www.thenetplanet.com"
5073 ),
5074 "soso" => array(
5075 "icon" => "soso",
5076 "title" => "Soso",
5077 "rule" => array(
5078 "^Soso(image)?spider" => ""
5079 ),
5080 "uri" => "http://help.soso.com/soso-image-spider.htm"
5081 ),
5082 "souppot" => array(
5083 "icon" => "robot",
5084 "title" => "SoupPot",
5085 "rule" => array(
5086 "SoupPotBot" => ""
5087 ),
5088 "uri" => ""
5089 ),
5090 "specificmedia" => array(
5091 "icon" => "specificmedia",
5092 "title" => "Specific Media",
5093 "rule" => array(
5094 "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5095 ),
5096 "uri" => ""
5097 ),
5098 "sphider" => array(
5099 "icon" => "sphider",
5100 "title" => "Sphider",
5101 "rule" => array(
5102 "Sphider" => ""
5103 ),
5104 "uri" => "http://www.sphider.eu"
5105 ),
5106 "spinn3r" => array(
5107 "icon" => "robot",
5108 "title" => "Spinn3r",
5109 "rule" => array(
5110 "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5111 ),
5112 "uri" => "http://spinn3r.com/robot"
5113 ),
5114 "sproose" => array(
5115 "icon" => "robot",
5116 "title" => "Sproose",
5117 "rule" => array(
5118 "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5119 ),
5120 "uri" => "http://www.sproose.com/bot.html"
5121 ),
5122 "spurlbot" => array(
5123 "icon" => "robot",
5124 "title" => "SpurlBot",
5125 "rule" => array(
5126 "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5127 ),
5128 "uri" => ""
5129 ),
5130 "stardownloader" => array(
5131 "icon" => "stardownloader",
5132 "title" => "Star Downloader",
5133 "rule" => array(
5134 "^Star Downloader( Pro)?" => ""
5135 ),
5136 "uri" => ""
5137 ),
5138 "steeler" => array(
5139 "icon" => "robot",
5140 "title" => "Steeler",
5141 "rule" => array(
5142 "Steeler[ /]([0-9.]{1,10})" => "\\1"
5143 ),
5144 "uri" => ""
5145 ),
5146 "strategicboard" => array(
5147 "icon" => "strategicboard",
5148 "title" => "Strategic Board",
5149 "rule" => array(
5150 "Strategic Board Bot" => ""
5151 ),
5152 "uri" => "http://www.strategicboard.com"
5153 ),
5154 "suchbaer" => array(
5155 "icon" => "robot",
5156 "title" => "Suchbaer.de",
5157 "rule" => array(
5158 "^suchbaer\.de" => ""
5159 ),
5160 "uri" => "http://www.suchbaer.de/"
5161 ),
5162 "suchbot" => array(
5163 "icon" => "robot",
5164 "title" => "Suchbot",
5165 "rule" => array(
5166 "^suchbot" => ""
5167 ),
5168 "uri" => ""
5169 ),
5170 "suchende" => array(
5171 "icon" => "suchende",
5172 "title" => "Suchen.de",
5173 "rule" => array(
5174 "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5175 "^gonzo/([0-9.]{1,10})" => "\\1"
5176 ),
5177 "uri" => "http://www.suchen.de/"
5178 ),
5179 "suchknecht" => array(
5180 "icon" => "robot",
5181 "title" => "Suchknecht",
5182 "rule" => array(
5183 "^Suchknecht.at-Robot" => ""
5184 ),
5185 "uri" => "http://www.suchknecht.at/"
5186 ),
5187 "suchpad" => array(
5188 "icon" => "robot",
5189 "title" => "Suchpad",
5190 "rule" => array(
5191 "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5192 ),
5193 "uri" => "http://www.suchpad.de"
5194 ),
5195 "sunrise" => array(
5196 "icon" => "sunrise",
5197 "title" => "Sunrise",
5198 "rule" => array(
5199 "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5200 ),
5201 "uri" => ""
5202 ),
5203 "superbot" => array(
5204 "icon" => "superbot",
5205 "title" => "SuperBot",
5206 "rule" => array(
5207 "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5208 ),
5209 "uri" => ""
5210 ),
5211 "surfcontrol" => array(
5212 "icon" => "robot",
5213 "title" => "SurfControl",
5214 "rule" => array(
5215 "SurfControl" => "",
5216 "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5217 ),
5218 "uri" => ""
5219 ),
5220 "surfnet" => array(
5221 "icon" => "robot",
5222 "title" => "SURFnet",
5223 "rule" => array(
5224 "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5225 ),
5226 "uri" => ""
5227 ),
5228 "surfsafely" => array(
5229 "icon" => "robot",
5230 "title" => "Surfsafely",
5231 "rule" => array(
5232 "Submission Spider at surfsafely.com" => ""
5233 ),
5234 "uri" => "http://www.surfsafely.com"
5235 ),
5236 "surphace" => array(
5237 "icon" => "spherescout",
5238 "title" => "Surphace",
5239 "rule" => array(
5240 "Sphere Scout.+?([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; lazy .+? so the group gets the whole version, not just its last character (assumes PCRE matching - confirm)
5241 "Surphace.+v([0-9.]{1,10})" => "\\1" // the literal "v" anchors the start of the version, so greedy .+ is harmless here
5242 ),
5243 "uri" => "http://www.surphace.com"
5244 ),
5245 "surveybot" => array(
5246 "icon" => "surveybot",
5247 "title" => "Whois Survey",
5248 "rule" => array(
5249 "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5250 ),
5251 "uri" => ""
5252 ),
5253 "swoogle" => array(
5254 "icon" => "robot",
5255 "title" => "Swoogle",
5256 "rule" => array(
5257 "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5258 ),
5259 "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5260 ),
5261 "swse" => array(
5262 "icon" => "robot",
5263 "title" => "SWSE",
5264 "rule" => array(
5265 "sw\.deri\.org" => ""
5266 ),
5267 "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5268 ),
5269 "swish-e" => array(
5270 "icon" => "swish-e",
5271 "title" => "Swish-e",
5272 "rule" => array(
5273 "^swish-e" => ""
5274 ),
5275 "uri" => "http://swish-e.org/"
5276 ),
5277 "sygol" => array(
5278 "icon" => "sygol",
5279 "title" => "Sygol",
5280 "rule" => array(
5281 "www.sygol.(com|net)" => ""
5282 ),
5283 "uri" => "http://www.sygol.com"
5284 ),
5285 "syllabs" => array(
5286 "icon" => "syllabs",
5287 "title" => "Syllabs",
5288 "rule" => array(
5289 "Focal[-]([0-9.]{1,10})" => "\\1"
5290 ),
5291 "uri" => "http://www.syllabs.com/crawler.html"
5292 ),
5293 "synapse" => array(
5294 "icon" => "robot",
5295 "title" => "Synapse",
5296 "rule" => array(
5297 " Synapse\)" => ""
5298 ),
5299 "uri" => "http://ws.apache.org/synapse/"
5300 ),
5301 "sync2it" => array(
5302 "icon" => "robot",
5303 "title" => "Sync2it",
5304 "rule" => array(
5305 "^\!Susie" => ""
5306 ),
5307 "uri" => "http://www.sync2it.com/bms/susie.php"
5308 ),
5309 "syncit" => array(
5310 "icon" => "robot",
5311 "title" => "Syncit",
5312 "rule" => array(
5313 "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5314 ),
5315 "uri" => "http://www.syncit.com/"
5316 ),
5317 "syndic8" => array(
5318 "icon" => "syndic8",
5319 "title" => "Syndic8",
5320 "rule" => array(
5321 "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5322 ),
5323 "uri" => "http://www.syndic8.com/"
5324 ),
5325 "syndicatie" => array(
5326 "icon" => "robot",
5327 "title" => "Syndicatie.nl",
5328 "rule" => array(
5329 "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5330 "Syndicatie\.nl robot;" => ""
5331 ),
5332 "uri" => ""
5333 ),
5334 "synomia" => array(
5335 "icon" => "robot",
5336 "title" => "Synomia",
5337 "rule" => array(
5338 "^SynoBot" => ""
5339 ),
5340 "uri" => ""
5341 ),
5342 "synoo" => array(
5343 "icon" => "robot",
5344 "title" => "SynooBot",
5345 "rule" => array(
5346 "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5347 ),
5348 "uri" => ""
5349 ),
5350 "szukacz" => array(
5351 "icon" => "szukacz",
5352 "title" => "Szukacz",
5353 "rule" => array(
5354 "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5355 ),
5356 "uri" => ""
5357 ),
5358 "tagoo" => array(
5359 "icon" => "tagoobot",
5360 "title" => "Tagoo",
5361 "rule" => array(
5362 "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5363 ),
5364 "uri" => "http://www.tagoo.ru"
5365 ),
5366 "tagword" => array(
5367 "icon" => "tagword",
5368 "title" => "Tagword",
5369 "rule" => array(
5370 "^Tagword" => ""
5371 ),
5372 "uri" => "http://tagword.com/dmoz_survey.php"
5373 ),
5374 "trailfire" => array(
5375 "icon" => "trailfire",
5376 "title" => "Trailfire",
5377 "rule" => array(
5378 "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5379 ),
5380 "uri" => "http://trailfire.com"
5381 ),
5382 "tamu" => array(
5383 "icon" => "tamu",
5384 "title" => "Tamu Crawler",
5385 "rule" => array(
5386 "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5387 "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5388 ),
5389 "uri" => "http://irl.cs.tamu.edu/crawler/"
5390 ),
5391 "taptubot" => array(
5392 "icon" => "taptubot",
5393 "title" => "Taptu",
5394 "rule" => array(
5395 "taptubot" => ""
5396 ),
5397 "uri" => "http://www.taptu.com/corp/taptubot"
5398 ),
5399 "targetseek" => array(
5400 "icon" => "robot",
5401 "title" => "TargetSeek",
5402 "rule" => array(
5403 "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5404 ),
5405 "uri" => "http://www.targetgroups.net/TargetSeek.html"
5406 ),
5407 "taw" => array(
5408 "icon" => "taw",
5409 "title" => "TAW",
5410 "rule" => array(
5411 "TAW[ /]([0-9.]{1,10})" => "\\1"
5412 ),
5413 "uri" => "http://www.tawdis.net"
5414 ),
5415 "tcd" => array(
5416 "icon" => "tcd",
5417 "title" => "Trinity College Dublin",
5418 "rule" => array(
5419 "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5420 ),
5421 "uri" => "http://www.tcd.ie"
5422 ),
5423 "technorati" => array(
5424 "icon" => "technorati",
5425 "title" => "Technorati",
5426 "rule" => array(
5427 "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5428 ),
5429 "uri" => ""
5430 ),
5431 "teleport" => array(
5432 "icon" => "teleport",
5433 "title" => "Teleport",
5434 "rule" => array(
5435 "Teleport[ \-]?Pro" => ""
5436 ),
5437 "uri" => ""
5438 ),
5439 "terrar" => array(
5440 "icon" => "robot",
5441 "title" => "Terrar",
5442 "rule" => array(
5443 "^Fresh Search :: Terrar" => ""
5444 ),
5445 "uri" => ""
5446 ),
5447 "theophrastus" => array(
5448 "icon" => "robot",
5449 "title" => "Theophrastus",
5450 "rule" => array(
5451 "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5452 ),
5453 "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5454 ),
5455 "thumbnailscz" => array(
5456 "icon" => "robot",
5457 "title" => "Thumbnails.cz",
5458 "rule" => array(
5459 "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5460 ),
5461 "uri" => ""
5462 ),
5463 "thumbshot" => array(
5464 "icon" => "robot",
5465 "title" => "Thumbshots",
5466 "rule" => array(
5467 "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is the "Version: "/"v" prefix; the version digits are group 2
5468 "^thumbshots-de" => ""
5469 ),
5470 "uri" => "http://www.thumbshots.de"
5471 ),
5472 "thunderstone" => array(
5473 "icon" => "thunderstone",
5474 "title" => "Thunderstone",
5475 "rule" => array(
5476 "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5477 "search.thunderstone.com" => ""
5478 ),
5479 "uri" => "http://search.thunderstone.com/"
5480 ),
5481 "timbobot" => array(
5482 "icon" => "robot",
5483 "title" => "TimboBot",
5484 "rule" => array(
5485 "timboBot" => ""
5486 ),
5487 "uri" => ""
5488 ),
5489 "topsy" => array(
5490 "icon" => "topsy",
5491 "title" => "Topsy",
5492 "rule" => array(
5493 "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5494 ),
5495 "uri" => "http://labs.topsy.com/butterfly.html"
5496 ),
5497 "trayce" => array(
5498 "icon" => "robot",
5499 "title" => "Trayce",
5500 "rule" => array(
5501 "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5502 ),
5503 "uri" => ""
5504 ),
5505 "tricus" => array(
5506 "icon" => "robot",
5507 "title" => "Tricus",
5508 "rule" => array(
5509 "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5510 ),
5511 "uri" => ""
5512 ),
5513 "topicblogs" => array(
5514 "icon" => "robot",
5515 "title" => "Topicblogs",
5516 "rule" => array(
5517 "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5518 ),
5519 "uri" => ""
5520 ),
5521 "touche" => array(
5522 "icon" => "touche",
5523 "title" => "Touché",
5524 "rule" => array(
5525 "^Touche" => ""
5526 ),
5527 "uri" => "http://touche.com.ve"
5528 ),
5529 "tuezilla" => array(
5530 "icon" => "robot",
5531 "title" => "TÜzilla", // repaired mojibake: "Ãœ" was a double-encoded "Ü"
5532 "rule" => array(
5533 "tuezilla.de" => ""
5534 ),
5535 "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5536 ),
5537 "turnitin" => array(
5538 "icon" => "turnitin",
5539 "title" => "Turnitin",
5540 "rule" => array(
5541 "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5542 ),
5543 "uri" => ""
5544 ),
5545 "tutorgig" => array(
5546 "icon" => "robot",
5547 "title" => "TutorGig",
5548 "rule" => array(
5549 "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5550 ),
5551 "uri" => ""
5552 ),
5553 "twiceler" => array(
5554 "icon" => "cuill",
5555 "title" => "Cuill",
5556 "rule" => array(
5557 "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5558 "Twiceler" => ""
5559 ),
5560 "uri" => "http://www.cuill.com/twiceler/robot.html"
5561 ),
5562 "twingly" => array(
5563 "icon" => "twingly",
5564 "title" => "Twingly",
5565 "rule" => array(
5566 "Twingly Recon" => ""
5567 ),
5568 "uri" => "http://www.twingly.com/"
5569 ),
5570 "twitter" => array(
5571 "icon" => "twitter",
5572 "title" => "Twitter",
5573 "rule" => array(
5574 "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5575 ),
5576 "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5577 ),
5578 "typepad" => array(
5579 "icon" => "typepad",
5580 "title" => "TypePad",
5581 "rule" => array(
5582 "TypePad/([0-9a-z.]{1,10})" => "\\1"
5583 ),
5584 "uri" => ""
5585 ),
5586 "udmsearch" => array(
5587 "icon" => "robot",
5588 "title" => "UdmSearch",
5589 "rule" => array(
5590 "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5591 ),
5592 "uri" => ""
5593 ),
5594 "ukwizz" => array(
5595 "icon" => "ukwizz",
5596 "title" => "UKWizz",
5597 "rule" => array(
5598 "^Mackster.*ukwizz" => ""
5599 ),
5600 "uri" => "http://www.ukwizz.com"
5601 ),
5602 "ultraseek" => array(
5603 "icon" => "robot",
5604 "title" => "Ultraseek",
5605 "rule" => array(
5606 "Ultraseek" => ""
5607 ),
5608 "uri" => ""
5609 ),
5610 "ultraspider" => array(
5611 "icon" => "robot",
5612 "title" => "UltraSpider",
5613 "rule" => array(
5614 "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5615 ),
5616 "uri" => "http://www.search.ch"
5617 ),
5618 "umai" => array(
5619 "icon" => "robot",
5620 "title" => "Umai",
5621 "rule" => array(
5622 "umai[/ ]([0-9.]{1,10})" => "\\1"
5623 ),
5624 "uri" => ""
5625 ),
5626 "unchaos" => array(
5627 "icon" => "robot",
5628 "title" => "Unchaos",
5629 "rule" => array(
5630 "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5631 "unchaos" => ""
5632 ),
5633 "uri" => ""
5634 ),
5635 "unido" => array(
5636 "icon" => "robot",
5637 "title" => "UNIdo",
5638 "rule" => array(
5639 "^unido-bot" => "" // pattern has no capture group, so there is no version to reference
5640 ),
5641 "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5642 ),
5643 "updated" => array(
5644 "icon" => "robot",
5645 "title" => "Updated",
5646 "rule" => array(
5647 "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5648 ),
5649 "uri" => ""
5650 ),
5651 "uptimebot" => array(
5652 "icon" => "robot",
5653 "title" => "UptimeBot",
5654 "rule" => array(
5655 "^UptimeBot" => ""
5656 ),
5657 "uri" => "http://www.uptimebot.com/"
5658 ),
5659 "urifetch" => array(
5660 "icon" => "robot",
5661 "title" => "URI::Fetch",
5662 "rule" => array(
5663 "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5664 ),
5665 "uri" => ""
5666 ),
5667 "urlbase" => array(
5668 "icon" => "robot",
5669 "title" => "URLBase",
5670 "rule" => array(
5671 "URLBase[ /]([0-9.]{1,10})" => "\\1"
5672 ),
5673 "uri" => ""
5674 ),
5675 "urlblaze" => array(
5676 "icon" => "robot",
5677 "title" => "URLBlaze",
5678 "rule" => array(
5679 "^URLBlaze" => ""
5680 ),
5681 "uri" => ""
5682 ),
5683 "urlcontr" => array(
5684 "icon" => "robot",
5685 "title" => "MS URL Control",
5686 "rule" => array(
5687 "Microsoft URL[ \-]?Control" => ""
5688 ),
5689 "uri" => ""
5690 ),
5691 "urlgetfile" => array(
5692 "icon" => "robot",
5693 "title" => "URLGetFile",
5694 "rule" => array(
5695 "^URLGetFile" => ""
5696 ),
5697 "uri" => ""
5698 ),
5699 "urlscope" => array(
5700 "icon" => "robot",
5701 "title" => "UrlScope",
5702 "rule" => array(
5703 "UrlScope" => ""
5704 ),
5705 "uri" => ""
5706 ),
5707 "urltrends" => array(
5708 "icon" => "urltrends",
5709 "title" => "UrlTrends",
5710 "rule" => array(
5711 "Snappy/([0-9.]{1,10})" => "\\1",
5712 ),
5713 "uri" => ""
5714 ),
5715 "usww" => array(
5716 "icon" => "usww",
5717 "title" => "USWW",
5718 "rule" => array(
5719 "usww\.com" => "",
5720 "Mozilla/5\.0 URL-Spider" => ""
5721 ),
5722 "uri" => "http://www.usww.com/"
5723 ),
5724 "usyd" => array(
5725 "icon" => "robot",
5726 "title" => "USyd-NLP-Spider",
5727 "rule" => array(
5728 "^USyd-NLP-Spider" => ""
5729 ),
5730 "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5731 ),
5732 "vagabondo" => array(
5733 "icon" => "wiseguys",
5734 "title" => "WiseGuys",
5735 "rule" => array(
5736 "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5737 "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5738 ),
5739 "uri" => ""
5740 ),
5741 "unicorn" => array(
5742 "icon" => "w3c",
5743 "title" => "W3C Unicorn",
5744 "rule" => array(
5745 "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5746 ),
5747 "uri" => "http://validator.w3.org/unicorn/"
5748 ),
5749 "validator" => array(
5750 "icon" => "w3c",
5751 "title" => "W3C Validator",
5752 "rule" => array(
5753 "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5754 ),
5755 "uri" => "http://validator.w3.org/"
5756 ),
5757 "validator.nu" => array(
5758 "icon" => "validatornu",
5759 "title" => "Validator.nu",
5760 "rule" => array(
5761 "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5762 "^Validator.nu/LV" => "" // fallback rule without a capture group: no version to reference
5763 ),
5764 "uri" => "http://validator.nu/"
5765 ),
5766 "verity" => array(
5767 "icon" => "robot",
5768 "title" => "Verity",
5769 "rule" => array(
5770 "^vspider[ /]([0-9.]{1,10})" => "\\1",
5771 "^vspider" => ""
5772 ),
5773 "uri" => "http://www.verity.com/"
5774 ),
5775 "versionsproject" => array(
5776 "icon" => "robot",
5777 "title" => "Versions-project",
5778 "rule" => array(
5779 "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5780 ),
5781 "uri" => "http://www.versions-project.org/"
5782 ),
5783 "verticalmatch" => array(
5784 "icon" => "robot",
5785 "title" => "VerticalMatch",
5786 "rule" => array(
5787 "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5788 ),
5789 "uri" => "http://www.VerticalMatch.com/"
5790 ),
5791 "verzamelgids" => array(
5792 "icon" => "robot",
5793 "title" => "Verzamelgids",
5794 "rule" => array(
5795 "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5796 ),
5797 "uri" => "http://www.verzamelgids.nl/"
5798 ),
5799 "vestris" => array(
5800 "icon" => "vestris",
5801 "title" => "Vestris",
5802 "rule" => array(
5803 "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5804 ),
5805 "uri" => "http://alkaline.vestris.com/"
5806 ),
5807 "vindex" => array(
5808 "icon" => "vindex",
5809 "title" => "Vindex",
5810 "rule" => array(
5811 "Vindex[ /]([0-9.]{1,10})" => "\\1"
5812 ),
5813 "uri" => ""
5814 ),
5815 "visvo" => array(
5816 "icon" => "robot",
5817 "title" => "Visvo",
5818 "rule" => array(
5819 "VisBot[ /]([0-9.]{1,10})" => "\\1"
5820 ),
5821 "uri" => "http://www.visvo.com"
5822 ),
5823 "voila" => array(
5824 "icon" => "voila",
5825 "title" => "Voila",
5826 "rule" => array(
5827 "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5828 "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5829 ),
5830 "uri" => ""
5831 ),
5832 "vonna" => array(
5833 "icon" => "robot",
5834 "title" => "Vonna",
5835 "rule" => array(
5836 "Vonna.com b o t" => ""
5837 ),
5838 "uri" => ""
5839 ),
5840 "vortex" => array(
5841 "icon" => "robot",
5842 "title" => "Vortex",
5843 "rule" => array(
5844 "Vortex[ /]([0-9.]{1,10})" => "\\1"
5845 ),
5846 "uri" => "http://marty.anstey.ca/robots/vortex/"
5847 ),
5848 "w3sitesearch" => array(
5849 "icon" => "w3sitesearch",
5850 "title" => "W3SiteSearch",
5851 "rule" => array(
5852 "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5853 ),
5854 "uri" => "http://www.w3sitesearch.de"
5855 ),
5856 "wagger" => array(
5857 "icon" => "robot",
5858 "title" => "Wagger",
5859 "rule" => array(
5860 "^Waggr" => ""
5861 ),
5862 "uri" => "http://www.waggr.com/"
5863 ),
5864 "wanadoo" => array(
5865 "icon" => "robot",
5866 "title" => "Wanadoo",
5867 "rule" => array(
5868 "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5869 ),
5870 "uri" => "http://www.wanadoo.fr/"
5871 ),
5872 "wapalizer" => array(
5873 "icon" => "robot",
5874 "title" => "Wapalizer",
5875 "rule" => array(
5876 "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5877 ),
5878 "uri" => "http://www.wapdrive.com/"
5879 ),
5880 "watson" => array(
5881 "icon" => "addy",
5882 "title" => "Dr.Watson",
5883 "rule" => array(
5884 "Watson[ /]([0-9.]{1,10})" => "\\1",
5885 "watson\.addy\.com" => ""
5886 ),
5887 "uri" => ""
5888 ),
5889 "wavefire" => array(
5890 "icon" => "robot",
5891 "title" => "Wavefire",
5892 "rule" => array(
5893 "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
5894 ),
5895 "uri" => ""
5896 ),
5897 "waypath" => array(
5898 "icon" => "waypath",
5899 "title" => "Waypath",
5900 "rule" => array(
5901 "Waypath[ \-]?Scout" => "",
5902 "Waypath (development )?crawler" => ""
5903 ),
5904 "uri" => ""
5905 ),
5906 "wauuu" => array(
5907 "icon" => "wauuu",
5908 "title" => "Wauuu",
5909 "rule" => array(
5910 "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the pattern has a single capture group, which holds the version
5911 ),
5912 "uri" => "http://www.wauuu.com"
5913 ),
5914 "wdg" => array(
5915 "icon" => "wdg",
5916 "title" => "WDG Validator",
5917 "rule" => array(
5918 "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
5919 ),
5920 "uri" => "http://www.htmlhelp.com/tools/validator/"
5921 ),
5922 "webagogo" => array(
5923 "icon" => "webagogo",
5924 "title" => "Webagogo",
5925 "rule" => array(
5926 "^Webagogo" => ""
5927 ),
5928 "uri" => "http://www.webagogo.be/"
5929 ),
5930 "webalta" => array(
5931 "icon" => "webalta",
5932 "title" => "WebAlta",
5933 "rule" => array(
5934 "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
5935 ),
5936 "uri" => "http://www.webalta.net/ru/about_webmaster.html"
5937 ),
5938 "webdigity" => array(
5939 "icon" => "robot",
5940 "title" => "Webdigity Whois Service",
5941 "rule" => array(
5942 "^webdigity whois service" => ""
5943 ),
5944 "uri" => "http://www.webdigity.com/ws"
5945 ),
5946 "webelixir" => array(
5947 "icon" => "webelixir",
5948 "title" => "Webelixir",
5949 "rule" => array(
5950 "^webelixir" => ""
5951 ),
5952 "uri" => "http://www.webelixir.net/"
5953 ),
5954 "webbotru" => array(
5955 "icon" => "robot",
5956 "title" => "Webbot.ru",
5957 "rule" => array(
5958 " Webbot[/ ]([0-9.]{1,10})" => "\\1"
5959 ),
5960 "uri" => "http://www.webbot.ru/bot.html"
5961 ),
5962 "webcapture" => array(
5963 "icon" => "robot",
5964 "title" => "WebCapture",
5965 "rule" => array(
5966 "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
5967 ),
5968 "uri" => ""
5969 ),
5970 "webcollage" => array(
5971 "icon" => "robot",
5972 "title" => "Webcollage",
5973 "rule" => array(
5974 "webcollage" => ""
5975 ),
5976 "uri" => ""
5977 ),
5978 "webcopier" => array(
5979 "icon" => "webcopier",
5980 "title" => "WebCopier",
5981 "rule" => array(
5982 "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
5983 ),
5984 "uri" => ""
5985 ),
5986 "webcorp" => array(
5987 "icon" => "webcorp",
5988 "title" => "WebCorp",
5989 "rule" => array(
5990 "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
5991 ),
5992 "uri" => "http://www.webcorp.org.uk/"
5993 ),
5994 "webcrawl" => array(
5995 "icon" => "robot",
5996 "title" => "WebCrawl",
5997 "rule" => array(
5998 "webcrawl\.net" => ""
5999 ),
6000 "uri" => ""
6001 ),
6002 "webdownloader" => array(
6003 "icon" => "robot",
6004 "title" => "Web Downloader",
6005 "rule" => array(
6006 "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6007 ),
6008 "uri" => ""
6009 ),
6010 "webfetch" => array(
6011 "icon" => "robot",
6012 "title" => "WebFetch",
6013 "rule" => array(
6014 "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6015 ),
6016 "uri" => ""
6017 ),
6018 "webfind" => array(
6019 "icon" => "robot",
6020 "title" => "WebFind",
6021 "rule" => array(
6022 "^WebFindBot" => ""
6023 ),
6024 "uri" => "http://www.web-find.com"
6025 ),
6026 "webglimpse" => array(
6027 "icon" => "robot",
6028 "title" => "Webglimpse",
6029 "rule" => array(
6030 "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6031 ),
6032 "uri" => "http://webglimpse.net"
6033 ),
6034 "webgobbler" => array(
6035 "icon" => "robot",
6036 "title" => "webGobbler",
6037 "rule" => array(
6038 "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6039 ),
6040 "uri" => ""
6041 ),
6042 "webimages" => array(
6043 "icon" => "webimages",
6044 "title" => "WebImages",
6045 "rule" => array(
6046 "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6047 ),
6048 "uri" => "http://herbert.groot.jebbink.nl/"
6049 ),
6050 "weblight" => array(
6051 "icon" => "robot",
6052 "title" => "WebLight",
6053 "rule" => array(
6054 "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6055 ),
6056 "uri" => "http://www.illumit.com/Products/weblight/"
6057 ),
6058 "weblinks" => array(
6059 "icon" => "robot",
6060 "title" => "WebLink's",
6061 "rule" => array(
6062 "^Weblink.s checker" => ""
6063 ),
6064 "uri" => ""
6065 ),
6066 "webmeasurement" => array(
6067 "icon" => "robot",
6068 "title" => "Webmeasurement",
6069 "rule" => array(
6070 "^webmeasurement-bot" => ""
6071 ),
6072 "uri" => "http://rvs.informatik.uni-leipzig.de"
6073 ),
6074 "webminer" => array(
6075 "icon" => "robot",
6076 "title" => "WebMiner",
6077 "rule" => array(
6078 "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6079 ),
6080 "uri" => ""
6081 ),
6082 "webmin" => array(
6083 "icon" => "webmin",
6084 "title" => "Webmin",
6085 "rule" => array(
6086 "^webmin" => ""
6087 ),
6088 "uri" => ""
6089 ),
6090 "webmon" => array(
6091 "icon" => "webmon",
6092 "title" => "Webmon",
6093 "rule" => array(
6094 "WebMon[ /]([0-9.]{1,10})" => "\\1"
6095 ),
6096 "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6097 ),
6098 "webox" => array(
6099 "icon" => "robot",
6100 "title" => "WeBoX", // stray leading space removed from the title
6101 "rule" => array(
6102 "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6103 ),
6104 "uri" => ""
6105 ),
6106 "webpatrol" => array(
6107 "icon" => "webpatrol",
6108 "title" => "WebPatrol",
6109 "rule" => array(
6110 "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6111 ),
6112 "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6113 ),
6114 "webpix" => array(
6115 "icon" => "webpix",
6116 "title" => "WebPix",
6117 "rule" => array(
6118 "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6119 ),
6120 "uri" => ""
6121 ),
6122 "webrace" => array(
6123 "icon" => "robot",
6124 "title" => "WebRACE",
6125 "rule" => array(
6126 "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6127 ),
6128 "uri" => ""
6129 ),
6130 "webreaper" => array(
6131 "icon" => "webreaper",
6132 "title" => "WebReaper",
6133 "rule" => array(
6134 "^WebReaper " => ""
6135 ),
6136 "uri" => "http://www.webreaper.net/"
6137 ),
6138 "webresult" => array(
6139 "icon" => "robot",
6140 "title" => "Webresult",
6141 "rule" => array(
6142 "Der webresult\.de Robot" => ""
6143 ),
6144 "uri" => ""
6145 ),
6146 "webring" => array(
6147 "icon" => "robot",
6148 "title" => "Webring Checker",
6149 "rule" => array(
6150 "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6151 ),
6152 "uri" => ""
6153 ),
6154 "webripper" => array(
6155 "icon" => "webripper",
6156 "title" => "WebRipper",
6157 "rule" => array(
6158 "^WebRipper" => ""
6159 ),
6160 "uri" => "http://calluna-software.com"
6161 ),
6162 "webscaled" => array(
6163 "icon" => "webscaled",
6164 "title" => "Webscaled",
6165 "rule" => array(
6166 "Swarm" => ""
6167 ),
6168 "uri" => "http://webscaled.com/"
6169 ),
6170 "websearchau" => array(
6171 "icon" => "websearchau",
6172 "title" => "WebSearch.COM.AU",
6173 "rule" => array(
6174 "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6175 ),
6176 "uri" => "http://WebSearch.com.au/"
6177 ),
6178 "websearchbench" => array(
6179 "icon" => "robot",
6180 "title" => "WebSearchBench",
6181 "rule" => array(
6182 "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6183 ),
6184 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6185 ),
6186 "websense" => array(
6187 "icon" => "websense",
6188 "title" => "Websense",
6189 "rule" => array(
6190 "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6191 ),
6192 "uri" => ""
6193 ),
6194 "websiteshadow" => array(
6195 "icon" => "websiteshadow",
6196 "title" => "Websiteshadow",
6197 "rule" => array(
6198 "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6199 ),
6200 "uri" => "http://websiteshadow.com"
6201 ),
6202 "websiteworth" => array(
6203 "icon" => "robot",
6204 "title" => "WebsiteWorth",
6205 "rule" => array(
6206 "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6207 ),
6208 "uri" => "http://directory.sootle.com/website-worth/tata.php"
6209 ),
6210 "websquash" => array(
6211 "icon" => "websquash",
6212 "title" => "Websquash",
6213 "rule" => array(
6214 "webs(quash\.com|ite[ \-]?Monitor)" => ""
6215 ),
6216 "uri" => ""
6217 ),
6218 "webstripper" => array(
6219 "icon" => "robot",
6220 "title" => "WebStripper",
6221 "rule" => array(
6222 "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6223 ),
6224 "uri" => ""
6225 ),
6226 "webzip" => array(
6227 "icon" => "webzip",
6228 "title" => "WebZIP",
6229 "rule" => array(
6230 "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6231 ),
6232 "uri" => ""
6233 ),
6234 "wep" => array(
6235 "icon" => "robot",
6236 "title" => "WEP Search",
6237 "rule" => array(
6238 "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6239 ),
6240 "uri" => ""
6241 ),
6242 "westwind" => array(
6243 "icon" => "robot",
6244 "title" => "West Wind Internet Protocols",
6245 "rule" => array(
6246 "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6247 ),
6248 "uri" => "http://www.west-wind.com/wwipstuff.asp"
6249 ),
6250 "wget" => array(
6251 "icon" => "wget",
6252 "title" => "Wget",
6253 "rule" => array(
6254 "Wget[ /]([0-9.]{1,10})" => "\\1",
6255 "Wget" => ""
6256 ),
6257 "uri" => ""
6258 ),
6259 "whizbang" => array(
6260 "icon" => "whizbang",
6261 "title" => "WhizBang",
6262 "rule" => array(
6263 "WhizBang" => ""
6264 ),
6265 "uri" => "http://www.whizbang.com/crawler/"
6266 ),
6267 "whois" => array(
6268 "icon" => "whois",
6269 "title" => "Who.is",
6270 "rule" => array(
6271 "Who.is Bot" => ""
6272 ),
6273 "uri" => "http://www.who.is/"
6274 ),
6275 "wikiwix" => array(
6276 "icon" => "wikiwix",
6277 "title" => "Wikiwix",
6278 "rule" => array(
6279 "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6280 ),
6281 "uri" => "http://www.wikiwix.com/"
6282 ),
6283 "wingflyer" => array(
6284 "icon" => "robot",
6285 "title" => "WingFlyer",
6286 "rule" => array(
6287 "^WebFetch" => ""
6288 ),
6289 "uri" => "http://www.wingflyer.com/"
6290 ),
6291 "wininet" => array(
6292 "icon" => "robot",
6293 "title" => "WinInet",
6294 "rule" => array(
6295 "TeamSoft WinInet Component" => ""
6296 ),
6297 "uri" => "http://www.winsoft.sk/wininet.htm"
6298 ),
6299 "winhttp" => array(
6300 "icon" => "robot",
6301 "title" => "WinHTTP",
6302 "rule" => array(
6303 "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6304 ),
6305 "uri" => ""
6306 ),
6307 "wire" => array(
6308 "icon" => "robot",
6309 "title" => "WIRE",
6310 "rule" => array(
6311 "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6312 ),
6313 "uri" => ""
6314 ),
6315 "wmp" => array(
6316 "icon" => "robot",
6317 "title" => "WMP",
6318 "rule" => array(
6319 "^WMP" => ""
6320 ),
6321 "uri" => ""
6322 ),
6323 "woozweb" => array(
6324 "icon" => "woozweb",
6325 "title" => "Woozweb",
6326 "rule" => array(
6327 "woozweb" => ""
6328 ),
6329 "uri" => "http://www.woozweb.com/"
6330 ),
6331 "wordchamp" => array(
6332 "icon" => "robot",
6333 "title" => "WordChamp",
6334 "rule" => array(
6335 "^WordChampBot" => ""
6336 ),
6337 "uri" => "http://www.wordchamp.com/"
6338 ),
6339 "wordpress" => array(
6340 "icon" => "wordpress",
6341 "title" => "WordPress",
6342 "rule" => array(
6343 "WordPress[ /]([0-9.]{1,10})" => "\\1"
6344 ),
6345 "uri" => ""
6346 ),
6347 "worio" => array(
6348 "icon" => "worio",
6349 "title" => "Worio",
6350 "rule" => array(
6351 "woriobot" => ""
6352 ),
6353 "uri" => "http://worio.com/"
6354 ),
6355 "worldlight" => array(
6356 "icon" => "worldlight",
6357 "title" => "WorldLight",
6358 "rule" => array(
6359 "^WorldLight" => ""
6360 ),
6361 "uri" => ""
6362 ),
6363 "worqmada" => array(
6364 "icon" => "robot",
6365 "title" => "WorQmada",
6366 "rule" => array(
6367 "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6368 ),
6369 "uri" => ""
6370 ),
6371 "wotbox" => array(
6372 "icon" => "wotbox",
6373 "title" => "Wotbox",
6374 "rule" => array(
6375 "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6376 ),
6377 "uri" => ""
6378 ),
6379 "wp" => array(
6380 "icon" => "wp",
6381 "title" => "Wirtualna Polska",
6382 "rule" => array(
6383 "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6384 ),
6385 "uri" => "http://wp.pl"
6386 ),
6387 "wsb" => array(
6388 "icon" => "robot",
6389 "title" => "WebSearchBench",
6390 "rule" => array(
6391 "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6392 "WSB " => ""
6393 ),
6394 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6395 ),
6396 "wume" => array(
6397 "icon" => "robot",
6398 "title" => "WUME Lab's",
6399 "rule" => array(
6400 "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6401 ),
6402 "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6403 ),
6404 "wusage" => array(
6405 "icon" => "wusage",
6406 "title" => "Wusage",
6407 "rule" => array(
6408 "Wusage[ /]([0-9.]{1,10})" => "\\1",
6409 ),
6410 "uri" => "http://www.boutell.com/wusage/"
6411 ),
6412 "wwgrapevine" => array(
6413 "icon" => "wwgrapevine",
6414 "title" => "WWgrapevine",
6415 "rule" => array(
6416 "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6417 ),
6418 "uri" => ""
6419 ),
6420 "wws" => array(
6421 "icon" => "robot",
6422 "title" => "WWSBOT",
6423 "rule" => array(
6424 "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6425 ),
6426 "uri" => "http://www.analyzer.nu"
6427 ),
6428 "www4mail" => array(
6429 "icon" => "robot",
6430 "title" => "WWW4mail",
6431 "rule" => array(
6432 "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6433 ),
6434 "uri" => "http://www.www4mail.org/"
6435 ),
6436 "wwwc" => array(
6437 "icon" => "wwwc",
6438 "title" => "WWWC",
6439 "rule" => array(
6440 "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6441 ),
6442 "uri" => ""
6443 ),
6444 "wwwd" => array(
6445 "icon" => "robot",
6446 "title" => "WWWD",
6447 "rule" => array(
6448 "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6449 ),
6450 "uri" => ""
6451 ),
6452 "wwweasel" => array(
6453 "icon" => "wwweasel",
6454 "title" => "WWWeasel",
6455 "rule" => array(
6456 "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6457 ),
6458 "uri" => ""
6459 ),
6460 "wwwfi" => array(
6461 "icon" => "wwwfi",
6462 "title" => "www.fi",
6463 "rule" => array(
6464 "www\.fi crawler" => ""
6465 ),
6466 "uri" => "http://www.fi/"
6467 ),
6468 "wwwmechanize" => array(
6469 "icon" => "robot",
6470 "title" => "WWW-Mechanize",
6471 "rule" => array(
6472 "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6473 ),
6474 "uri" => ""
6475 ),
6476 "wwwoffle" => array(
6477 "icon" => "robot",
6478 "title" => "WWWoffle",
6479 "rule" => array(
6480 "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6481 ),
6482 "uri" => ""
6483 ),
6484 "wwwster" => array(
6485 "icon" => "robot",
6486 "title" => "WWWster",
6487 "rule" => array(
6488 "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6489 ),
6490 "uri" => ""
6491 ),
6492 "wysigot" => array(
6493 "icon" => "wysigot",
6494 "title" => "Wysigot",
6495 "rule" => array(
6496 "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6497 ),
6498 "uri" => ""
6499 ),
6500 "xaldon" => array(
6501 "icon" => "xaldon",
6502 "title" => "Xaldon",
6503 "rule" => array(
6504 "Xaldon WebSpider" => ""
6505 ),
6506 "uri" => "http://www.xaldon.de/"
6507 ),
6508 "xenu" => array(
6509 "icon" => "xenu",
6510 "title" => "Xenu Link Sleuth",
6511 "rule" => array(
6512 "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6513 "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional "&#039;s"; the version is group 2
6514 "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6515 ),
6516 "uri" => "http://home.snafu.de/tilman/xenulink.html"
6517 ),
6518 "xerka" => array(
6519 "icon" => "xerka",
6520 "title" => "Xerka",
6521 "rule" => array(
6522 "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6523 ),
6524 "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6525 ),
6526 "xirq" => array(
6527 "icon" => "robot",
6528 "title" => "XIRQ",
6529 "rule" => array(
6530 "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6531 ),
6532 "uri" => "http://www.xirq.com"
6533 ),
6534 "xmlslurp" => array(
6535 "icon" => "robot",
6536 "title" => "XMLSlurp",
6537 "rule" => array(
6538 "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6539 ),
6540 "uri" => ""
6541 ),
6542 "xml-sitemaps" => array(
6543 "icon" => "xml-sitemaps",
6544 "title" => "XML-Sitemaps",
6545 "rule" => array(
6546 "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6547 ),
6548 "uri" => ""
6549 ),
6550 "xmlrpc" => array(
6551 "icon" => "robot",
6552 "title" => "Trackback",
6553 "rule" => array(
6554 "XMLRPC" => ""
6555 ),
6556 "uri" => ""
6557 ),
6558 "xovi" => array(
6559 "icon" => "xovi",
6560 "title" => "Xovi",
6561 "rule" => array(
6562 "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6563 ),
6564 "uri" => "http://www.xovibot.net"
6565 ),
6566 "yacy" => array(
6567 "icon" => "yacy",
6568 "title" => "Yacy",
6569 "rule" => array(
6570 "yacy\.net" => ""
6571 ),
6572 "uri" => ""
6573 ),
6574 "yahoo" => array(
6575 "icon" => "yahoo",
6576 "title" => "Yahoo",
6577 "rule" => array(
6578 "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6579 "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6580 "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6581 "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6582 "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6583 "Y!OASIS/TEST" => "",
6584 "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6585 "Y!J; for robot study" => "",
6586 "Yahoo Japan; for robot study" => ""
6587 ),
6588 "uri" => "http://www.yahoo.com"
6589 ),
6590 "yahoo-feed" => array(
6591 "icon" => "yahoo",
6592 "title" => "Yahoo Feedseeker",
6593 "rule" => array(
6594 "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6595 ),
6596 "uri" => "http://www.yahoo.com"
6597 ),
6598 "yandex" => array(
6599 "icon" => "yandex",
6600 "title" => "Yandex",
6601 "rule" => array(
6602 "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6603 "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6604 ),
6605 "uri" => "http://yandex.com/bots"
6606 ),
6607 "yanga" => array(
6608 "icon" => "yanga",
6609 "title" => "Yanga",
6610 "rule" => array (
6611 "^Yanga.*v([0-9.]{1,10})" => "\\1"
6612 ),
6613 "uri" => "http://www.yanga.co.uk/"
6614 ),
6615 "yap" => array(
6616 "icon" => "yap",
6617 "title" => "Yap",
6618 "rule" => array(
6619 "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6620 ),
6621 "uri" => "http://www.yapinc.com/"
6622 ),
6623 "yarienavoir" => array(
6624 "icon" => "robot",
6625 "title" => "Yarienavoir",
6626 "rule" => array(
6627 "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6628 ),
6629 "uri" => "http://www.yarienavoir.net/"
6630 ),
6631 "yell" => array(
6632 "icon" => "yell",
6633 "title" => "Yell",
6634 "rule" => array(
6635 "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6636 "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6637 ),
6638 "uri" => ""
6639 ),
6640 "youdao" => array(
6641 "icon" => "youdao",
6642 "title" => "Youdao",
6643 "rule" => array(
6644 "YodaoBot(-Image|-Mobile)?[ /]([0-9.]{1,10})" => "\\2", // hyphenated suffix is optional so a plain "YodaoBot/1.0" matches too
6645 "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6646 ),
6647 "uri" => "http://www.youdao.com/help/webmaster/spider/"
6648 ),
6649 "yoogli" => array(
6650 "icon" => "yoogli",
6651 "title" => "Yoogli",
6652 "rule" => array(
6653 "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6654 ),
6655 "uri" => "http://www.yoogli.com"
6656 ),
6657 "yotta" => array(
6658 "icon" => "robot",
6659 "title" => "Yotta",
6660 "rule" => array(
6661 "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6662 "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6663 ),
6664 "uri" => "http://www.yottacars.com"
6665 ),
6666 "yoono" => array(
6667 "icon" => "yoono",
6668 "title" => "Yoono",
6669 "rule" => array(
6670 "Yoono" => ""
6671 ),
6672 "uri" => "http://www.yoono.com/"
6673 ),
6674 "yowedo" => array(
6675 "icon" => "robot",
6676 "title" => "Yowedo",
6677 "rule" => array(
6678 "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6679 ),
6680 "uri" => "http://yowedo.com/en/partners.html"
6681 ),
6682 "yuntis" => array(
6683 "icon" => "robot",
6684 "title" => "Yuntis",
6685 "rule" => array(
6686 "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6687 ),
6688 "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6689 ),
6690 "zao" => array(
6691 "icon" => "robot",
6692 "title" => "Zao",
6693 "rule" => array(
6694 "Zao[ /]([0-9.]{1,10})" => "\\1",
6695 "Zao-crawler" => ""
6696 ),
6697 "uri" => ""
6698 ),
6699 "zealbot" => array(
6700 "icon" => "zeal",
6701 "title" => "ZealBot",
6702 "rule" => array(
6703 "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6704 ),
6705 "uri" => ""
6706 ),
6707 "zearchit" => array(
6708 "icon" => "zearchit",
6709 "title" => "Zearchit",
6710 "rule" => array(
6711 "Zearchit" => ""
6712 ),
6713 "uri" => "http://www.zearchit.de/"
6714 ),
6715 "zebz" => array(
6716 "icon" => "robot",
6717 "title" => "ze.bz",
6718 "rule" => array(
6719 "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6720 ),
6721 "uri" => "http://www.ze.bz/"
6722 ),
6723 "zedzo" => array(
6724 "icon" => "robot",
6725 "title" => "Zedzo",
6726 "rule" => array(
6727 "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6728 ),
6729 "uri" => "http://www.zedzo.com/"
6730 ),
6731 "zerx" => array(
6732 "icon" => "zerx",
6733 "title" => "Zerx",
6734 "rule" => array(
6735 "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6736 ),
6737 "uri" => "http://www.zerx.com/"
6738 ),
6739 "zeus" => array(
6740 "icon" => "zeus",
6741 "title" => "Zeus",
6742 "rule" => array(
6743 "Zeus" => ""
6744 ),
6745 "uri" => "http://www.zeus.com"
6746 ),
6747 "zippp" => array(
6748 "icon" => "robot",
6749 "title" => "Zippp",
6750 "rule" => array(
6751 "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6752 ),
6753 "uri" => ""
6754 ),
6755 "zippy" => array(
6756 "icon" => "robot",
6757 "title" => "Zippy",
6758 "rule" => array(
6759 "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6760 ),
6761 "uri" => "http://www.zippyfinder.com"
6762 ),
6763 "zoeky" => array(
6764 "icon" => "robot",
6765 "title" => "Zoeky",
6766 "rule" => array(
6767 "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6768 ),
6769 "uri" => ""
6770 ),
6771 "zoom" => array(
6772 "icon" => "zoom",
6773 "title" => "ZoomSpider",
6774 "rule" => array(
6775 "^ZoomSpider" => ""
6776 ),
6777 "uri" => "http://www.wrensoft.com/"
6778 ),
6779 "zspider" => array(
6780 "icon" => "robot",
6781 "title" => "Zspider",
6782 "rule" => array(
6783 "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6784 ),
6785 "uri" => "http://feedback.redkolibri.com/"
6786 ),
6787 "zumbot" => array(
6788 "icon" => "robot",
6789 "title" => "ZUM Search",
6790 "rule" => array(
6791 "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6792 ),
6793 "uri" => "http://help.zum.com/inquiry"
6794 ),
6795 "zyborg" => array(
6796 "icon" => "zyborg",
6797 "title" => "WiseNutBot",
6798 "rule" => array(
6799 "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6800 ),
6801 "uri" => ""
6802 ),
6803 // Catch up for the originals; they have to stay in this order.
6804 "blogbot" => array(
6805 "icon" => "blogbot",
6806 "title" => "BlogBot",
6807 "rule" => array(
6808 "Blog[ \-]?Bot" => ""
6809 ),
6810 "uri" => "http://www.blogbot.com/"
6811 ),
6812 "centrum" => array(
6813 "icon" => "centrum",
6814 "title" => "Centrum",
6815 "rule" => array(
6816 "holmes[/ ]([0-9.]{1,10})" => "\\1",
6817 "^Centrum-checker" => ""
6818 ),
6819 "uri" => ""
6820 ),
6821 "httpclient" => array(
6822 "icon" => "robot",
6823 "title" => "HTTPClient",
6824 "rule" => array(
6825 "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6826 "HTTP[ \-]?Client" => ""
6827 ),
6828 "uri" => "http://www.innovation.ch/java/HTTPClient/"
6829 ),
6830 "incywincy" => array(
6831 "icon" => "robot",
6832 "title" => "IncyWincy",
6833 "rule" => array(
6834 "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6835 "^IncyWincy" => ""
6836 ),
6837 "uri" => ""
6838 ),
6839 "java" => array(
6840 "icon" => "java",
6841 "title" => "Java",
6842 "rule" => array(
6843 "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6844 ),
6845 "uri" => ""
6846 ),
6847 "libfetch" => array(
6848 "icon" => "robot",
6849 "title" => "Libfetch",
6850 "rule" => array(
6851 "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6852 ),
6853 "uri" => "http://www.freebsd.org/"
6854 ),
6855 "libwww" => array(
6856 "icon" => "libwww",
6857 "title" => "LibWWW",
6858 "rule" => array(
6859 "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6860 "^libww(w|w-perl|w-FM)" => "",
6861 "MyApp.*libww(w|w-perl|w-FM)" => ""
6862 ),
6863 "uri" => ""
6864 ),
6865 "litefinder" => array(
6866 "icon" => "litefinder",
6867 "title" => "LiteFinder",
6868 "rule" => array(
6869 "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6870 ),
6871 "uri" => "http://www.litefinder.net/about.html"
6872 ),
6873 "nutchorg" => array(
6874 "icon" => "nutchorg",
6875 "title" => "Nutch",
6876 "rule" => array(
6877 "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6878 "Nutch" => ""
6879 ),
6880 "uri" => "http://lucene.apache.org/nutch/"
6881 ),
6882 "pythonurl" => array(
6883 "icon" => "pythonurl",
6884 "title" => "Python-url",
6885 "rule" => array(
6886 "Python[ \-]?urllib" => ""
6887 ),
6888 "uri" => ""
6889 ),
6890 // Robots known to be SPAM BOTS
6891 "SPAM" => array(
6892 "icon" => "robot",
6893 "title" => "SPAM",
6894 "rule" => array(
6895 "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
6896 "^PHOTO CHECK" => "",
6897 "^FOTOCHECKER" => "",
6898 "^IPTC CHECK" => "",
6899 "^DataCha0s" => "",
6900 "^Mac Finder" => "",
6901 "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
6902 "^Missouri College Browse" => "",
6903 "Email[ \-]?Siphon" => "",
6904 "atSpider" => "",
6905 "autoemailspider" => "",
6906 "^Demo Bot" => "",
6907 "^Program Shareware" => "",
6908 "^Snapbot" => "",
6909 "^snap.com" => "",
6910 "^Guestbook Auto Submitter" => "",
6911 "panscient.com" => "",
6912 ),
6913 "uri" => ""
6914 ),
6915 // Things we don't know yet
6916 "robot" => array(
6917 "icon" => "robot",
6918 "title" => "Robot",
6919 "rule" => array(
6920 "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
6921 )
6922 )
6923 );
6924 ?>

Properties

Name Value
svn:keywords Id