ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 430
Committed: Wed Apr 26 15:57:01 2023 UTC (19 months ago) by joku
File size: 160840 byte(s)
Log Message:

File Contents

# Content
1 <?php
2 /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3 *
4 * SVN FILE $Id$
5 *
6 * Copyright (C) 2001-2023, the BBClone Team (see doc/authors.txt for details)
7 *
8 * This program is free software: you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation, either version 3 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * See doc/copying.txt for details
19 */
20
21 /////////////////////
22 // Robot Detection //
23 /////////////////////
24
25 $robot = array(
26 "1noon" => array(
27 "icon" => "1noon",
28 "title" => "1noon",
29 "rule" => array(
30 "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31 "^Yeti$" => ""
32 ),
33 "uri" => ""
34 ),
35 "123people" => array(
36 "icon" => "123people",
37 "title" => "123people",
38 "rule" => array(
39 "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40 ),
41 "uri" => "http://www.123people.fr/"
42 ),
43 "123spider" => array(
44 "icon" => "robot",
45 "title" => "123Spider",
46 "rule" => array(
47 "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48 ),
49 "uri" => "http://www.123spider.de/"
50 ),
51 "192com" => array( // Entry for the 192.com agent: icon, title, rule table (regex pattern => value) and URI.
52 "icon" => "robot",
53 "title" => "192.com",
54 "rule" => array(
55 "192\.comAgent" => "" // dot escaped so it matches a literal "." only, like the other host-name rules in this table
56 ),
57 "uri" => "http://www.192.com/"
58 ),
59 "200please" => array(
60 "icon" => "200please",
61 "title" => "200please Crawler",
62 "rule" => array(
63 "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64 ),
65 "uri" => "http://www.200please.com/bot"
66 ),
67 "2dehands" => array(
68 "icon" => "2dehands",
69 "title" => "2deHands",
70 "rule" => array(
71 "2dehands\.nl" => ""
72 ),
73 "uri" => ""
74 ),
75 "80legs" => array(
76 "icon" => "80legs",
77 "title" => "80legs",
78 "rule" => array(
79 "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80 ),
81 "uri" => "http://www.80legs.com/"
82 ),
83 "a1sitemap" => array(
84 "icon" => "a1sitemap",
85 "title" => "A1 Sitemap",
86 "rule" => array(
87 "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88 "miggibot[ /]([0-9.]{1,10})" => "\\1"
89 ),
90 "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91 ),
92 "a2b" => array(
93 "icon" => "a2b",
94 "title" => "A2B",
95 "rule" => array(
96 "www\.a2b\.cc" => ""
97 ),
98 "uri" => "http://www.a2b.cc"
99 ),
100 "abacho" => array(
101 "icon" => "robot",
102 "title" => "Abacho",
103 "rule" => array(
104 "^ABACHOBot" => ""
105 ),
106 "uri" => ""
107 ),
108 "abcdatos" => array(
109 "icon" => "abcdatos",
110 "title" => "ABCdatos",
111 "rule" => array(
112 "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113 ),
114 "uri" => "http://www.abcdatos.com/"
115 ),
116 "abot" => array(
117 "icon" => "abot",
118 "title" => "aBot",
119 "rule" => array(
120 "^abot[ /]([0-9.]{1,10})" => "\\1"
121 ),
122 "uri" => ""
123 ),
124 "about" => array(
125 "icon" => "about",
126 "title" => "About",
127 "rule" => array(
128 "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129 "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130 ),
131 "uri" => ""
132 ),
133 "aboutus" => array(
134 "icon" => "aboutus",
135 "title" => "AboutUs",
136 "rule" => array(
137 "AboutUsBot" => ""
138 ),
139 "uri" => "http://www.aboutus.org/"
140 ),
141 "ackerm" => array( // Entry for Ackerm: icon, title, rule table (regex pattern => value) and URI.
142 "icon" => "robot",
143 "title" => "Ackerm",
144 "rule" => array(
145 "www\.ackerm\.com" => "" // dots escaped so only the literal host name matches
146 ),
147 "uri" => "http://www.ackerm.com/"
148 ),
149 "acoi" => array(
150 "icon" => "acoi",
151 "title" => "AcoiRobot",
152 "rule" => array(
153 "^AcoiRobot" => ""
154 ),
155 "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156 ),
157 "acoon" => array(
158 "icon" => "acoon",
159 "title" => "Acoon",
160 "rule" => array(
161 "Acoon[ \-]?Robot" => ""
162 ),
163 "uri" => ""
164 ),
165 "accoona" => array(
166 "icon" => "accoona",
167 "title" => "Accoona",
168 "rule" => array(
169 "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170 "^accoona" => ""
171 ),
172 "uri" => ""
173 ),
174 "acme" => array(
175 "icon" => "acme",
176 "title" => "Acme",
177 "rule" => array(
178 "^Acme\.Spider" => ""
179 ),
180 "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181 ),
182 "active" => array(
183 "icon" => "robot",
184 "title" => "ActiveBookmark",
185 "rule" => array(
186 "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187 ),
188 "uri" => ""
189 ),
190 "admuncher" => array(
191 "icon" => "robot",
192 "title" => "Ad Muncher",
193 "rule" => array(
194 "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195 ),
196 "uri" => ""
197 ),
198 "aesop" => array(
199 "icon" => "robot",
200 "title" => "Aesop",
201 "rule" => array(
202 "^AESOP_com_SpiderMan" => ""
203 ),
204 "uri" => "http://www.aesop.com"
205 ),
206 "agada" => array(
207 "icon" => "robot",
208 "title" => "Agada",
209 "rule" => array(
210 "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211 ),
212 "uri" => ""
213 ),
214 "ahrefs" => array(
215 "icon" => "ahrefs",
216 "title" => "Ahrefs",
217 "rule" => array(
218 "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219 ),
220 "uri" => "http://ahrefs.com/"
221 ),
222 "aibot" => array(
223 "icon" => "robot",
224 "title" => "Aibot",
225 "rule" => array(
226 "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227 ),
228 "uri" => ""
229 ),
230 "aihitbot" => array(
231 "icon" => "robot",
232 "title" => "aiHit",
233 "rule" => array(
234 "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235 ),
236 "uri" => "http://www.aihit.com/"
237 ),
238 "aipbot" => array(
239 "icon" => "robot",
240 "title" => "Aipbot",
241 "rule" => array(
242 "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243 ),
244 "uri" => ""
245 ),
246 "aleksika" => array(
247 "icon" => "aleksika",
248 "title" => "Aleksika",
249 "rule" => array(
250 "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251 ),
252 "uri" => ""
253 ),
254 "alertsite" => array(
255 "icon" => "alertsite",
256 "title" => "AlertSite",
257 "rule" => array(
258 "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259 ),
260 "uri" => "http://www.alertsite.com/index.html"
261 ),
262 "alexa" => array(
263 "icon" => "alexa",
264 "title" => "Alexa",
265 "rule" => array(
266 "^ia_archive" => ""
267 ),
268 "uri" => "http://www.alexa.com/"
269 ),
270 "almaden" => array(
271 "icon" => "almaden",
272 "title" => "IBM Crawler",
273 "rule" => array(
274 "www\.almaden\.ibm\.com/cs/crawler" => ""
275 ),
276 "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277 ),
278 "altavista" => array(
279 "icon" => "altavista",
280 "title" => "Altavista",
281 "rule" => array(
282 "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283 "AltaVista V([0-9.]{1,10})" => "\\1",
284 "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285 ),
286 "uri" => "http://www.altavista.com/"
287 ),
288 "amazon" => array(
289 "icon" => "amazon",
290 "title" => "Amazon",
291 "rule" => array(
292 "^(aranhabot|amzn_assoc)" => "",
293 "^NutchEC2Test" => "",
294 "Amazonbot[/ ]([0-9.]{1,10})" => "\\1"
295 ),
296 "uri" => "http://www.amazon.com/"
297 ),
298 "amidalla" => array(
299 "icon" => "amidalla",
300 "title" => "Amidalla",
301 "rule" => array(
302 "^amibot" => ""
303 ),
304 "uri" => ""
305 ),
306 "amfibi" => array(
307 "icon" => "amfibi",
308 "title" => "Amfibi",
309 "rule" => array(
310 "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
311 "Amfibibot" => ""
312 ),
313 "uri" => ""
314 ),
315 "amphetadesk" => array(
316 "icon" => "robot",
317 "title" => "AmphetaDesk",
318 "rule" => array(
319 "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
320 ),
321 "uri" => ""
322 ),
323 "amphetameme" => array(
324 "icon" => "robot",
325 "title" => "Amphetameme",
326 "rule" => array(
327 "amphetameme[ \-]?crawler" => ""
328 ),
329 "uri" => ""
330 ),
331 "annomille" => array(
332 "icon" => "robot",
333 "title" => "AnnoMille",
334 "rule" => array(
335 "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
336 ),
337 "uri" => "http://www.annomille.it"
338 ),
339 "anonymouse" => array( // Entry for Anonymouse.org: icon, title, rule table (regex pattern => value) and URI.
340 "icon" => "anonymouse",
341 "title" => "Anonymouse.org",
342 "rule" => array(
343 "http://Anonymouse\.org" => "" // dot escaped so only the literal host name matches
344 ),
345 "uri" => "http://anonymouse.org"
346 ),
347 "ansearch" => array(
348 "icon" => "robot",
349 "title" => "Ansearch",
350 "rule" => array(
351 "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
352 ),
353 "uri" => ""
354 ),
355 "answerchase" => array(
356 "icon" => "answerchase",
357 "title" => "AnswerChase",
358 "rule" => array(
359 "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
360 ),
361 "uri" => "http://www.answerchase.com/"
362 ),
363 "antibot" => array(
364 "icon" => "robot",
365 "title" => "Antibot",
366 "rule" => array(
367 "antibot-V([0-9.]{1,10})" => "\\1"
368 ),
369 "uri" => ""
370 ),
371 "aonde" => array(
372 "icon" => "aonde",
373 "title" => "Aonde",
374 "rule" => array(
375 "^AONDE-Spider" => ""
376 ),
377 "uri" => ""
378 ),
379 "aonline" => array(
380 "icon" => "robot",
381 "title" => "A-Online.at",
382 "rule" => array(
383 "^A-Online Search" => ""
384 ),
385 "uri" => "http://www.a-online.at/"
386 ),
387 "aol" => array(
388 "icon" => "aol",
389 "title" => "AOLserver",
390 "rule" => array(
391 "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
392 "^AOLserver" => ""
393 ),
394 "uri" => ""
395 ),
396 "apachebench" => array(
397 "icon" => "robot",
398 "title" => "ApacheBench",
399 "rule" => array(
400 "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
401 ),
402 "uri" => ""
403 ),
404 "apassion4jazz" => array(
405 "icon" => "robot",
406 "title" => "Passion 4 Jazz",
407 "rule" => array(
408 "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
409 ),
410 "uri" => "http://www.apassion4jazz.net/bebopbot.html"
411 ),
412 "apexoo" => array(
413 "icon" => "robot",
414 "title" => "Apexoo",
415 "rule" => array(
416 "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
417 ),
418 "uri" => "http://www.apexoo.com/"
419 ),
420 "apnoti" => array(
421 "icon" => "apnoti",
422 "title" => "Apnoti",
423 "rule" => array(
424 "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
425 ),
426 "uri" => "http://www.apnoti.com/"
427 ),
428 "aport" => array(
429 "icon" => "aport",
430 "title" => "Aport",
431 "rule" => array(
432 "^Aport" => ""
433 ),
434 "uri" => ""
435 ),
436 "appie" => array(
437 "icon" => "walhello",
438 "title" => "Walhello",
439 "rule" => array(
440 "appie[ /]([0-9.]{1,10})" => "\\1"
441 ),
442 "uri" => ""
443 ),
444 "apple" => array(
445 "icon" => "apple",
446 "title" => "Apple",
447 "rule" => array(
448 "Applebot[ /]([0-9.]{1,10})" => "\\1"
449 ),
450 "uri" => "http://www.apple.com/go/applebot"
451 ),
452
453 "arachmo" => array(
454 "icon" => "arachmo",
455 "title" => "Arachmo",
456 "rule" => array(
457 "compatible; Arachmo" => ""
458 ),
459 "uri" => ""
460 ),
461 "arexera" => array(
462 "icon" => "arexera",
463 "title" => "Arexera",
464 "rule" => array(
465 "^X-Crawler" => "",
466 "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
467 ),
468 "uri" => "http://www.arexera.de/"
469 ),
470 "arianna" => array( // Entry for Arianna: icon, title, rule table (regex pattern => value) and URI.
471 "icon" => "arianna",
472 "title" => "Arianna",
473 "rule" => array(
474 "^www\.arianna\.it" => "" // dots escaped so only the literal host name matches
475 ),
476 "uri" => "http://www.arianna.it/"
477 ),
478 "artface" => array(
479 "icon" => "robot",
480 "title" => "Artface",
481 "rule" => array(
482 "^ArtfaceBot" => ""
483 ),
484 "uri" => ""
485 ),
486 "artviper" => array(
487 "icon" => "artviper",
488 "title" => "artViper",
489 "rule" => array(
490 "artViper" => ""
491 ),
492 "uri" => "http://www.artviper.net/"
493 ),
494 "asinfo" => array(
495 "icon" => "robot",
496 "title" => "Any Search Info",
497 "rule" => array(
498 "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
499 ),
500 "uri" => "http://search-info.com/"
501 ),
502 "ask" => array(
503 "icon" => "askjeeves",
504 "title" => "Ask Jeeves",
505 "rule" => array(
506 "Ask[ \-]?Jeeves" => "",
507 "teomaagent" => ""
508 ),
509 "uri" => ""
510 ),
511 "askaboutoil" => array( // Entry for the AskAboutOil crawler: icon, title, rule table (regex pattern => back-reference) and URI.
512 "icon" => "robot",
513 "title" => "AskAboutOil", // was "ASPseek", duplicated from the separate "aspseek" entry
514 "rule" => array(
515 "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
516 ),
517 "uri" => "http://askaboutoil.com/"
518 ),
519 "asked" => array(
520 "icon" => "robot",
521 "title" => "AskEd!",
522 "rule" => array(
523 "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
524 ),
525 "uri" => "http://asked.jp"
526 ),
527 "aspseek" => array(
528 "icon" => "robot",
529 "title" => "ASPseek",
530 "rule" => array(
531 "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
532 ),
533 "uri" => ""
534 ),
535 "atlocal" => array(
536 "icon" => "robot",
537 "title" => "At Local",
538 "rule" => array(
539 "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
540 ),
541 "uri" => "http://www.atlocal.com/"
542 ),
543 "atomz" => array(
544 "icon" => "atomz",
545 "title" => "Atomz",
546 "rule" => array(
547 "Atomz[/ ]([0-9.]{1,10})" => "\\1"
548 ),
549 "uri" => ""
550 ),
551 "avira" => array(
552 "icon" => "avira",
553 "title" => "Avira SafeSearch",
554 "rule" => array(
555 "^SafeSearch microdata crawler" => ""
556 ),
557 "uri" => "https://safesearch.avira.com"
558 ),
559 "axel" => array(
560 "icon" => "robot",
561 "title" => "Axel",
562 "rule" => array(
563 "^axel" => ""
564 ),
565 "uri" => ""
566 ),
567 "axmo" => array(
568 "icon" => "axmo",
569 "title" => "Axmo",
570 "rule" => array(
571 "AxmoRobot" => ""
572 ),
573 "uri" => ""
574 ),
575 "answerbus" => array(
576 "icon" => "answerbus",
577 "title" => "AnswerBus",
578 "rule" => array(
579 "answerbus" => ""
580 ),
581 "uri" => ""
582 ),
583 "automapit" => array(
584 "icon" => "robot",
585 "title" => "AutoMapIt",
586 "rule" => array(
587 "AutoMapIt[ /](Bot)?" => ""
588 ),
589 "uri" => "http://www.automapit.com/bot.html"
590 ),
591 "augurnfind" => array(
592 "icon" => "robot",
593 "title" => "Augurnfind",
594 "rule" => array(
595 "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
596 ),
597 "uri" => ""
598 ),
599 "awasu" => array(
600 "icon" => "awasu",
601 "title" => "Awasu",
602 "rule" => array(
603 "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
604 ),
605 "uri" => ""
606 ),
607 "axxus" => array(
608 "icon" => "axxus",
609 "title" => "axxus.de",
610 "rule" => array(
611 "whoiam" => ""
612 ),
613 "uri" => "http://www.axxus.de/"
614 ),
615 "ayell" => array(
616 "icon" => "ayell",
617 "title" => "Ayell",
618 "rule" => array(
619 "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
620 ),
621 "uri" => "http://eurobot.ayell.eu"
622 ),
623 "babaloo" => array(
624 "icon" => "babaloo",
625 "title" => "Babaloo",
626 "rule" => array(
627 "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
628 ),
629 "uri" => "http://www.babaloo.si"
630 ),
631 "babe" => array( // Entry for ba.be: icon, title, rule table (regex pattern => value) and URI.
632 "icon" => "robot",
633 "title" => "ba.be",
634 "rule" => array(
635 "BACS http://www\.ba\.be" => "" // dots escaped so only the literal host name matches
636 ),
637 "uri" => "http://www.ba.be/"
638 ),
639 "baidu" => array(
640 "icon" => "baidu",
641 "title" => "Baidu",
642 "rule" => array(
643 "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
644 "Baiduspider" => ""
645 ),
646 "uri" => "http://www.baidu.com/search/spider.html"
647 ),
648 "bananatree" => array(
649 "icon" => "robot",
650 "title" => "BananaTree",
651 "rule" => array(
652 "www\.thebananatree\.org" => ""
653 ),
654 "uri" => "http://www.thebananatree.org/"
655 ),
656 "bdcindexer" => array(
657 "icon" => "robot",
658 "title" => "bdcindexer",
659 "rule" => array(
660 "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
661 ),
662 "uri" => "http://www.business.com/"
663 ),
664 "bdfetch" => array(
665 "icon" => "robot",
666 "title" => "BDFetch",
667 "rule" => array(
668 "^BDFetch" => ""
669 ),
670 "uri" => ""
671 ),
672 "bdncentral" => array(
673 "icon" => "robot",
674 "title" => "Bdncentral",
675 "rule" => array(
676 "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
677 ),
678 "uri" => "http://www.bdncentral.com/robot.html"
679 ),
680 "beammachine" => array(
681 "icon" => "robot",
682 "title" => "BeamMachine",
683 "rule" => array(
684 "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
685 ),
686 "uri" => "http://www.beammachine.net/"
687 ),
688 "become" => array(
689 "icon" => "become",
690 "title" => "Become",
691 "rule" => array(
692 "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
693 "(BecomeBot|Exabot)@exava\.com\)$" => ""
694 ),
695 "uri" => "http://www.become.com/"
696 ),
697 "beebware" => array( // Entry for Beebware: icon, title, rule table (regex pattern => back-reference) and URI.
698 "icon" => "robot",
699 "title" => "Beebware",
700 "rule" => array(
701 "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the pattern has exactly one capture group, so group 2 never exists
702 ),
703 "uri" => ""
704 ),
705 "bigbrother" => array(
706 "icon" => "robot",
707 "title" => "Big Brother",
708 "rule" => array(
709 "^Big Brother" => ""
710 ),
711 "uri" => "http://pauillac.inria.fr/~fpottier/"
712 ),
713 "bigclique" => array(
714 "icon" => "robot",
715 "title" => "BigClique",
716 "rule" => array(
717 "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
718 ),
719 "uri" => "http://www.bigclique.com"
720 ),
721 "biglotron" => array( // Entry for Biglotron: icon, title, rule table (regex pattern => value) and URI.
722 "icon" => "robot",
723 "title" => "Biglotron",
724 "rule" => array(
725 "^BIGLOTRON" => ""
726 ),
727 "uri" => "http://www.bigclique.com" // NOTE(review): identical to the "bigclique" entry's URI; possibly a copy-paste, confirm the intended address
728 ),
729 "bigsearch" => array( // Entry for Bigsearch: icon, title, rule table (regex pattern => back-reference) and URI.
730 "icon" => "bigsearch",
731 "title" => "Bigsearch",
732 "rule" => array(
733 "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped so only the literal "Bigsearch.ca" matches
734 ),
735 "uri" => ""
736 ),
737 "bilbo" => array(
738 "icon" => "robot",
739 "title" => "Bilbo",
740 "rule" => array(
741 "Bilbo[ /]([0-9.]{1,10})" => "\\1"
742 ),
743 "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
744 ),
745 "bilgi" => array( // Entry for Bilgi: icon, title, rule table (regex pattern => back-reference) and URI.
746 "icon" => "bilgi",
747 "title" => "Bilgi",
748 "rule" => array(
749 "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "(Beta)"; the numeric capture is group 2
750 ),
751 "uri" => "http://www.bilgi.com/"
752 ),
753 "bitacle" => array(
754 "icon" => "bitacle",
755 "title" => "Bitacle",
756 "rule" => array(
757 "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
758 ),
759 "uri" => "http://bitacle.org/"
760 ),
761 "bitbeamer" => array(
762 "icon" => "bitbeamer",
763 "title" => "BitBeamer",
764 "rule" => array(
765 "BitBeamer/([0-9.]{1,10})" => "\\1"
766 ),
767 "uri" => ""
768 ),
769 "biz360" => array(
770 "icon" => "biz360",
771 "title" => "Biz360",
772 "rule" => array(
773 "^Biz360 spider" => ""
774 ),
775 "uri" => ""
776 ),
777 "backlinktest" => array(
778 "icon" => "backlinktest",
779 "title" => "BacklinkCrawler",
780 "rule" => array(
781 "BacklinkCrawler" => ""
782 ),
783 "uri" => "http://www.backlinktest.com/crawler.html"
784 ),
785 "blaizbee" => array( // Entry for Blaiz-Bee: icon, title, rule table (regex pattern => back-reference) and URI.
786 "icon" => "blaiz-bee",
787 "title" => "Blaiz-Bee",
788 "rule" => array(
789 "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // was "": the numeric group was captured but never referenced, unlike every other capturing rule here
790 ),
791 "uri" => ""
792 ),
793 "blogbeat" => array(
794 "icon" => "robot",
795 "title" => "BlogBeat",
796 "rule" => array(
797 "BlogBeat/?([0-9.]{1,10})" => "\\1",
798 ),
799 "uri" => "http://www.blogbeat.nl"
800 ),
801 "blogbotde" => array(
802 "icon" => "robot",
803 "title" => "blogbot.de",
804 "rule" => array(
805 "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
806 ),
807 "uri" => "http://blogbot.de/"
808 ),
809 "blogcensus" => array(
810 "icon" => "blogcensus",
811 "title" => "Blogcensus",
812 "rule" => array(
813 "^Blogcensus" => "",
814 ),
815 "uri" => "http://blogcensus.de/bot/"
816 ),
817 "blogdex" => array(
818 "icon" => "robot",
819 "title" => "Blogdex",
820 "rule" => array(
821 "Blogdex[ /]([0-9.]{1,10})" => "\\1",
822 ),
823 "uri" => ""
824 ),
825 "blogg" => array(
826 "icon" => "blogg",
827 "title" => "Blogg",
828 "rule" => array(
829 "^blogg\.de" => ""
830 ),
831 "uri" => ""
832 ),
833 "blogland" => array(
834 "icon" => "robot",
835 "title" => "BlogLand",
836 "rule" => array(
837 "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
838 ),
839 "uri" => ""
840 ),
841 "bloglines" => array(
842 "icon" => "bloglines",
843 "title" => "Bloglines",
844 "rule" => array(
845 "Bloglines[ /]([0-9.]{1,10})" => "\\1",
846 "Bloglines" => ""
847 ),
848 "uri" => ""
849 ),
850 "blogmap" => array(
851 "icon" => "robot",
852 "title" => "Blogmap",
853 "rule" => array(
854 "blogmap" => ""
855 ),
856 "uri" => ""
857 ),
858 "blogosphere" => array(
859 "icon" => "robot",
860 "title" => "Blogosphere",
861 "rule" => array(
862 "Blogosphere" => ""
863 ),
864 "uri" => ""
865 ),
866 "blogpeople" => array(
867 "icon" => "robot",
868 "title" => "BlogPeople",
869 "rule" => array(
870 "BlogPeople" => ""
871 ),
872 "uri" => ""
873 ),
874 "blogpulse" => array(
875 "icon" => "blogpulse",
876 "title" => "Blogpulse",
877 "rule" => array(
878 "Blogpulse" => ""
879 ),
880 "uri" => ""
881 ),
882 "blogranking" => array(
883 "icon" => "blogranking",
884 "title" => "BlogRanking",
885 "rule" => array(
886 "^BlogRanking(/RSS checker)?" => ""
887 ),
888 "uri" => ""
889 ),
890 "blogs" => array(
891 "icon" => "blogs",
892 "title" => "Blo.gs",
893 "rule" => array(
894 "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
895 "blo\.gs" => ""
896 ),
897 "uri" => ""
898 ),
899 "blogshares" => array(
900 "icon" => "blogshares",
901 "title" => "BlogShares",
902 "rule" => array(
903 "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
904 "(^| |\()Blogshares(\.com| |\))" => ""
905 ),
906 "uri" => ""
907 ),
908 "blogslife" => array( // Entry keyed "blogslife": icon, title, rule table (regex pattern => value) and URI.
909 "icon" => "robot",
910 "title" => "BlogsLife",
911 "rule" => array(
912 "Blogslive" => "" // NOTE(review): the rule matches "Blogslive" while the key and title spell "BlogsLife"; confirm which spelling is intended
913 ),
914 "uri" => ""
915 ),
916 "blogsnow" => array(
917 "icon" => "blogsnow",
918 "title" => "BlogsNow",
919 "rule" => array(
920 "blogsnowbot" => "",
921 "BlogsNow" => ""
922 ),
923 "uri" => ""
924 ),
925 "blogstreet" => array(
926 "icon" => "blogstreet",
927 "title" => "BlogStreet",
928 "rule" => array(
929 "^BlogStreetBot" => ""
930 ),
931 "uri" => ""
932 ),
933 "blogsurf" => array(
934 "icon" => "robot",
935 "title" => "BlogSurf",
936 "rule" => array(
937 "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
938 ),
939 "uri" => ""
940 ),
941 "blogtick" => array(
942 "icon" => "robot",
943 "title" => "BlogTick",
944 "rule" => array(
945 "BlogTickServer" => ""
946 ),
947 "uri" => ""
948 ),
949 "blogwatcher" => array(
950 "icon" => "blogwatcher",
951 "title" => "Blogwatcher",
952 "rule" => array(
953 "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
954 ),
955 "uri" => ""
956 ),
957 "blogwise" => array(
958 "icon" => "blogwise",
959 "title" => "Blogwise",
960 "rule" => array(
961 "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
962 ),
963 "uri" => ""
964 ),
965 "boardreader" => array(
966 "icon" => "boardreader",
967 "title" => "BoardReader",
968 "rule" => array(
969 "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
970 ),
971 "uri" => "http://www.boardreader.com"
972 ),
973 "bobby" => array(
974 "icon" => "bobby",
975 "title" => "Bobby",
976 "rule" => array(
977 "bobby[ /]([0-9.]{1,10})" => "\\1"
978 ),
979 "uri" => ""
980 ),
981 "boitho" => array(
982 "icon" => "robot",
983 "title" => "Boitho",
984 "rule" => array(
985 "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
986 ),
987 "uri" => ""
988 ),
989 "booch" => array(
990 "icon" => "robot",
991 "title" => "Booch",
992 "rule" => array(
993 "^booch[_ /]([0-9.]{1,10})" => "\\1"
994 ),
995 "uri" => ""
996 ),
997 "book" => array(
998 "icon" => "book",
999 "title" => "Bookmark",
1000 "rule" => array(
1001 "http://www\.bookmark\.ne\.jp" => ""
1002 ),
1003 "uri" => ""
1004 ),
1005 "bookdog" => array(
1006 "icon" => "bookdog",
1007 "title" => "Bookdog",
1008 "rule" => array(
1009 "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1010 ),
1011 "uri" => ""
1012 ),
1013 "bordermanager" => array(
1014 "icon" => "bordermanager",
1015 "title" => "Border Manager",
1016 "rule" => array(
1017 "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1018 ),
1019 "uri" => ""
1020 ),
1021 "botonparade" => array(
1022 "icon" => "botonparade",
1023 "title" => "Bot on Parade",
1024 "rule" => array(
1025 "BotOnParade" => ""
1026 ),
1027 "uri" => "http://www.bots-on-para.de/bot.html"
1028 ),
1029 "botje" => array(
1030 "icon" => "botje",
1031 "title" => "Botje",
1032 "rule" => array(
1033 "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1034 ),
1035 "uri" => "http://www.botje.com/"
1036 ),
1037 "bottomfeeder" => array(
1038 "icon" => "bottomfeeder",
1039 "title" => "BottomFeeder",
1040 "rule" => array(
1041 "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1042 ),
1043 "uri" => ""
1044 ),
1045 "browseremulator" => array(
1046 "icon" => "browseremulator",
1047 "title" => "BrowserEmulator",
1048 "rule" => array(
1049 "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1050 ),
1051 "uri" => "http://www.dejavu.org/emulator.htm"
1052 ),
1053 "browsershots" => array(
1054 "icon" => "browsershots",
1055 "title" => "Browsershots",
1056 "rule" => array(
1057 "Browsershots URL Check" => ""
1058 ),
1059 "uri" => "http://browsershots.org"
1060 ),
1061 "browserspy" => array(
1062 "icon" => "robot",
1063 "title" => "BrowserSpy",
1064 "rule" => array(
1065 "BrowserSpy" => ""
1066 ),
1067 "uri" => ""
1068 ),
1069 "bruinbot" => array(
1070 "icon" => "robot",
1071 "title" => "BruinBot",
1072 "rule" => array(
1073 "BruinBot" => ""
1074 ),
1075 "uri" => ""
1076 ),
1077 "bruno" => array(
1078 "icon" => "robot",
1079 "title" => "Bruno",
1080 "rule" => array(
1081 "^Bruno" => ""
1082 ),
1083 "uri" => ""
1084 ),
1085 "btbot" => array(
1086 "icon" => "btbot",
1087 "title" => "BitTorrent",
1088 "rule" => array(
1089 "BTbot/([0-9.]{1,10})" => "\\1"
1090 ),
1091 "uri" => ""
1092 ),
1093 "bubing" => array(
1094 "icon" => "robot",
1095 "title" => "BUbiNG",
1096 "rule" => array(
1097 "BUbiNG" => ""
1098 ),
1099 "uri" => "http://law.di.unimi.it/BUbiNG.html"
1100 ),
1101 "builtwith" => array(
1102 "icon" => "builtwith",
1103 "title" => "BuiltWith",
1104 "rule" => array(
1105 "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1106 ),
1107 "uri" => "http://builtwith.com/bot.html"
1108 ),
1109 "bulkfeeds" => array(
1110 "icon" => "robot",
1111 "title" => "Bulkfeeds",
1112 "rule" => array(
1113 "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1114 ),
1115 "uri" => ""
1116 ),
1117 "burf" => array(
1118 "icon" => "burf",
1119 "title" => "Burf.com",
1120 "rule" => array(
1121 "^Norbert the Spider" => ""
1122 ),
1123 "uri" => "http://www.burf.com/"
1124 ),
1125 "butch" => array(
1126 "icon" => "robot",
1127 "title" => "Butch",
1128 "rule" => array(
1129 "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1130 ),
1131 "uri" => ""
1132 ),
1133 "buzzlogic" => array(
1134 "icon" => "buzzlogic",
1135 "title" => "Buzzlogic",
1136 "rule" => array(
1137 "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1138 ),
1139 "uri" => "http://www.buzzlogic.com"
1140 ),
1141 "catchbot" => array(
1142 "icon" => "catchbot",
1143 "title" => "CatchBot",
1144 "rule" => array(
1145 "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1146 ),
1147 "uri" => "http://www.catchbot.com"
1148 ),
1149 "camdiscover" => array(
1150 "icon" => "robot",
1151 "title" => "Camdiscover",
1152 "rule" => array(
1153 "^Camcrawler" => ""
1154 ),
1155 "uri" => ""
1156 ),
1157 "cazoodle" => array(
1158 "icon" => "cazoodle",
1159 "title" => "Cazoodle",
1160 "rule" => array(
1161 "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1162 "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1163 ),
1164 "uri" => "http://www.cazoodle.com/cazoodlebot"
1165 ),
1166 "ccbot" => array(
1167 "icon" => "robot",
1168 "title" => "ccBot",
1169 "rule" => array(
1170 "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1171 ),
1172 "uri" => "http://www.commoncrawl.org/bot.html"
1173 ),
1174 "ccgcrawl" => array(
1175 "icon" => "robot",
1176 "title" => "CCGCrawl",
1177 "rule" => array(
1178 "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1179 ),
1180 "uri" => "http://www.myworkbase.com/bot.html"
1181 ),
1182 "cerberian" => array(
1183 "icon" => "robot",
1184 "title" => "Cerberian Drtrs",
1185 "rule" => array(
1186 "^Cerberian Drtrs" => ""
1187 ),
1188 "uri" => ""
1189 ),
1190 "cfnetwork" => array( // Entry for CFNetwork: icon, title, rule table (regex pattern => back-reference) and URI.
1191 "icon" => "robot",
1192 "title" => "CFNetwork", // was "Cerberian Drtrs", duplicated from the preceding "cerberian" entry
1193 "rule" => array(
1194 "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1195 ),
1196 "uri" => "http://www.cfnetwork.be/"
1197 ),
1198 "charlotte" => array(
1199 "icon" => "charlotte",
1200 "title" => "Charlotte",
1201 "rule" => array(
1202 "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1203 ),
1204 "uri" => ""
1205 ),
1206 "cirilizator" => array(
1207 "icon" => "cirilizator",
1208 "title" => "Cirilizator",
1209 "rule" => array(
1210 "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1211 ),
1212 "uri" => ""
1213 ),
1214 "claria" => array(
1215 "icon" => "robot",
1216 "title" => "Claria",
1217 "rule" => array(
1218 "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1219 "(Claria|Diamond)(Bot)" => ""
1220 ),
1221 "uri" => ""
1222 ),
1223 "claymont" => array(
1224 "icon" => "claymont",
1225 "title" => "Claymont",
1226 "rule" => array(
1227 "claymont\.com" => "",
1228 "OliverPerry" => ""
1229 ),
1230 "uri" => "http://www.claymont.com"
1231 ),
1232 "clipinc" => array(
1233 "icon" => "clipinc",
1234 "title" => "ClipInc",
1235 "rule" => array(
1236 "ClipInc" => ""
1237 ),
1238 "uri" => "http://tobit.software"
1239 ),
1240 "clush" => array(
1241 "icon" => "clush",
1242 "title" => "Clush",
1243 "rule" => array(
1244 "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1245 ),
1246 "uri" => ""
1247 ),
1248 "cmsworldmap" => array(
1249 "icon" => "cmsworldmap",
1250 "title" => "CMS World Map",
1251 "rule" => array(
1252 "cmsworldmap" => ""
1253 ),
1254 "uri" => "http://www.cmsworldmap.com/"
1255 ),
1256 "cobion" => array(
1257 "icon" => "robot",
1258 "title" => "Cobion",
1259 "rule" => array(
1260 " (QXW03018|obot)\)" => ""
1261 ),
1262 "uri" => ""
1263 ),
1264 "coccoc" => array(
1265 "icon" => "coccoc",
1266 "title" => "Coccoc",
1267 "rule" => array(
1268 "coccoc[ /]([0-9.]{1,10})" => "\\1",
1269 "coccocbot-web[ /]([0-9.]{1,10})" => "\\1"
1270 ),
1271 "uri" => "http://help.coccoc.com"
1272 ),
1273 "coldfusion" => array(
1274 "icon" => "coldfusion",
1275 "title" => "ColdFusion",
1276 "rule" => array(
1277 "^coldfusion" => ""
1278 ),
1279 "uri" => ""
1280 ),
1281 "combine" => array(
1282 "icon" => "robot",
1283 "title" => "Combine",
1284 "rule" => array(
1285 "Combine[ /]([0-9.]{1,10})" => "\\1"
1286 ),
1287 "uri" => ""
1288 ),
1289 "combot" => array(
1290 "icon" => "robot",
1291 "title" => "comBot",
1292 "rule" => array(
1293 "^comBot[ /]([0-9.]{1,10})" => "\\1"
1294 ),
1295 "uri" => ""
1296 ),
1297 "comet" => array(
1298 "icon" => "comet",
1299 "title" => "Comet",
1300 "rule" => array(
1301 "cometsearch@cometsystems" => ""
1302 ),
1303 "uri" => ""
1304 ),
1305 "commerobo" => array(
1306 "icon" => "robot",
1307 "title" => "Commerobo",
1308 "rule" => array(
1309 "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1310 ),
1311 "uri" => ""
1312 ),
1313 "comrite" => array(
1314 "icon" => "robot",
1315 "title" => "ComRite",
1316 "rule" => array(
1317 "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1318 ),
1319 "uri" => "http://www.comrite.com/"
1320 ),
1321 "convera" => array(
1322 "icon" => "convera",
1323 "title" => "Convera",
1324 "rule" => array(
1325 "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1326 "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1327 ),
1328 "uri" => ""
1329 ),
1330 "coolbot" => array(
1331 "icon" => "robot",
1332 "title" => "CoolBot",
1333 "rule" => array(
1334 "^CoolBot" => ""
1335 ),
1336 "uri" => ""
1337 ),
1338 "cosmix" => array(
1339 "icon" => "robot",
1340 "title" => "Cosmix",
1341 "rule" => array(
1342 "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1343 ),
1344 "uri" => ""
1345 ),
1346 "cosmos" => array(
1347 "icon" => "robot",
1348 "title" => "Cosmos",
1349 "rule" => array(
1350 "^cosmos" => ""
1351 ),
1352 "uri" => ""
1353 ),
1354 "cosmoty" => array(
1355 "icon" => "robot",
1356 "title" => "Cosmoty",
1357 "rule" => array(
1358 "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1359 ),
1360 "uri" => "http://www.uchoose.de/crawler/beautybot/"
1361 ),
1362 "covario" => array(
1363 "icon" => "covario",
1364 "title" => "Covario",
1365 "rule" => array(
1366 "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1367 ),
1368 "uri" => "http://www.covario.com/ids/"
1369 ),
1370 "creativecommons" => array(
1371 "icon" => "creativecommons",
1372 "title" => "Creative Commons",
1373 "rule" => array(
1374 "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1375 ),
1376 "uri" => ""
1377 ),
1378 "cscrawler" => array(
1379 "icon" => "robot",
1380 "title" => "CsCrawler",
1381 "rule" => array(
1382 "CsCrawler" => ""
1383 ),
1384 "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1385 ),
1386 "jigsaw" => array(
1387 "icon" => "jigsaw",
1388 "title" => "Jigsaw",
1389 "rule" => array(
1390 "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1391 ),
1392 "uri" => "http://jigsaw.w3.org/css-validator/"
1393 ),
1394 "csscheck" => array(
1395 "icon" => "w3c",
1396 "title" => "W3C CSS Validator",
1397 "rule" => array(
1398 "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1399 ),
1400 "uri" => "http://jigsaw.w3.org/css-validator/"
1401 ),
1402 "custo" => array(
1403 "icon" => "robot",
1404 "title" => "Custo",
1405 "rule" => array(
1406 "Custo[ /]([0-9.]{1,10})" => "\\1"
1407 ),
1408 "uri" => ""
1409 ),
1410 "cybernavi" => array(
1411 "icon" => "robot",
1412 "title" => "CyberNavi",
1413 "rule" => array(
1414 "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1415 ),
1416 "uri" => ""
1417 ),
1418 "cyberpatrol" => array(
1419 "icon" => "cyberpatrol",
1420 "title" => "CyberPatrol",
1421 "rule" => array(
1422 "^CyberPatrol" => ""
1423 ),
1424 "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1425 ),
1426 "cyberz" => array(
1427 "icon" => "cyberz",
1428 "title" => "Cyberz",
1429 "rule" => array(
1430 "Cyberz Communication Agent" => ""
1431 ),
1432 "uri" => ""
1433 ),
1434 "cydral" => array(
1435 "goongee" => array( // GoonGee crawler; matched via its "Big Fish" user-agent token
1436 "icon" => "robot",
1437 "title" => "GoonGee",
1438 "rule" => array (
1439 "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // only one capture group exists (the version digits), so \1 - not \2 - is the valid reference
1440 ),
1441 "uri" => "http://www.goongee.com/"
1442 ),
1443 "icon" => "cynthia",
1444 "title" => "Cynthia Says",
1445 "rule" => array(
1446 "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1447 ),
1448 "uri" => ""
1449 ),
1450 "d4x" => array(
1451 "icon" => "d4x",
1452 "title" => "Downloader for X",
1453 "rule" => array(
1454 "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1455 ),
1456 "uri" => ""
1457 ),
1458 "da" => array(
1459 "icon" => "da",
1460 "title" => "DA",
1461 "rule" => array(
1462 "^DA[ /]([0-9.]{1,10})" => "\\1"
1463 ),
1464 "uri" => ""
1465 ),
1466 "daum" => array( // DAUM crawlers; each rule maps a user-agent regex to (presumably) the version back-reference
1467 "icon" => "daum",
1468 "title" => "DAUM",
1469 "rule" => array(
1470 "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1471 "Daum[ /]([0-9.]{1,10})" => "\\1",
1472 "DAUM Web Robot" => "",
1473 "daum\.net" => "", // dot escaped so only the literal host name matches, as other entries in this file do
1474 "Daum Communications Corp" => "",
1475 "EDI[ /]([0-9.]{1,10})" => "\\1",
1476 "Edacious.*Intelligent Web Robot" => "",
1477 "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1478 ),
1479 "uri" => "http://ws.daum.net/"
1480 ),
1481 "daypop" => array(
1482 "icon" => "robot",
1483 "title" => "Daypop",
1484 "rule" => array(
1485 "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1486 ),
1487 "uri" => ""
1488 ),
1489 "delfi" => array(
1490 "icon" => "delfi",
1491 "title" => "Delfi",
1492 "rule" => array(
1493 "crawl at delfi dot lt" => ""
1494 ),
1495 "uri" => ""
1496 ),
1497 "depspid" => array(
1498 "icon" => "depspid",
1499 "title" => "DepSpid",
1500 "rule" => array(
1501 "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1502 ),
1503 "uri" => ""
1504 ),
1505 "devonagent" => array(
1506 "icon" => "devonagent",
1507 "title" => "DEVONagent",
1508 "rule" => array(
1509 "DEVONtech" => ""
1510 ),
1511 "uri" => ""
1512 ),
1513 "diffbot" => array(
1514 "icon" => "diffbot",
1515 "title" => "Diffbot",
1516 "rule" => array(
1517 " Diffbot" => ""
1518 ),
1519 "uri" => "http://www.diffbot.com"
1520 ),
1521 "diribot" => array(
1522 "icon" => "diribot",
1523 "title" => "Diri",
1524 "rule" => array(
1525 "diribot" => ""
1526 ),
1527 "uri" => "http://www.diri.bg"
1528 ),
1529 "directhit" => array(
1530 "icon" => "robot",
1531 "title" => "Direct Hit",
1532 "rule" => array(
1533 "EZResult -- Internet Search Engine" => ""
1534 ),
1535 "uri" => "http://www.directhit.com"
1536 ),
1537 "disco" => array( // Disco crawler; matched by product token or by its contact address
1538 "icon" => "disco",
1539 "title" => "Disco",
1540 "rule" => array(
1541 "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1542 "discobot[/ -]([0-9.]{1,10})" => "\\1",
1543 "disco-crawl@discoveryengine\.com" => "" // dot escaped so it matches only the literal address
1544 ),
1545 "uri" => "http://www.discoveryengine.com/"
1546 ),
1547 "discopump" => array(
1548 "icon" => "robot",
1549 "title" => "DISCo Pump",
1550 "rule" => array(
1551 "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1552 ),
1553 "uri" => ""
1554 ),
1555 "dkimreputation" => array(
1556 "icon" => "dkimreputation",
1557 "title" => "DKIM Reputation",
1558 "rule" => array(
1559 "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1560 ),
1561 "uri" => "http://www.dkim-reputation.org"
1562 ),
1563 "dnsdigger" => array(
1564 "icon" => "dnsdigger",
1565 "title" => "DNS-Digger",
1566 "rule" => array(
1567 "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1568 ),
1569 "uri" => "http://www.dnsdigger.com"
1570 ),
1571 "dnsvalidation" => array(
1572 "icon" => "dnsvalidation",
1573 "title" => "DNS Validation",
1574 "rule" => array(
1575 "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1576 ),
1577 "uri" => "http://www.dnsvalidation.com/"
1578 ),
1579 "doctorhtml" => array(
1580 "icon" => "robot",
1581 "title" => "DoctorHTML",
1582 "rule" => array(
1583 "Doctor[ \-]?HTML" => ""
1584 ),
1585 "uri" => ""
1586 ),
1587 "dolphin" => array(
1588 "icon" => "dolphin",
1589 "title" => "Dolphin",
1590 "rule" => array(
1591 "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1592 ),
1593 "uri" => "http://telehouse.ru/crawler.html"
1594 ),
1595 "domaindatei" => array(
1596 "icon" => "robot",
1597 "title" => "Domaindatei",
1598 "rule" => array(
1599 "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1600 ),
1601 "uri" => ""
1602 ),
1603 "dontbuylists" => array(
1604 "icon" => "dontbuylists",
1605 "title" => "Dontbuylists",
1606 "rule" => array(
1607 "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1608 ),
1609 "uri" => "http://www.dontbuylists.com"
1610 ),
1611 "dotbot" => array(
1612 "icon" => "robot",
1613 "title" => "DotBot",
1614 "rule" => array(
1615 "DotBot[ /]([0-9.]{1,10})" => "\\1"
1616 ),
1617 "uri" => "http://www.dotnetdotcom.org"
1618 ),
1619 "doweb" => array( // DoWeb; the user agent is expected to start with the site's host name
1620 "icon" => "doweb",
1621 "title" => "DoWeb",
1622 "rule" => array(
1623 "^www\.doweb\.co\.uk" => "" // dots escaped so they match literally instead of any character
1624 ),
1625 "uri" => "http://www.doweb.co.uk/"
1626 ),
1627 "downforeveryoneorjustme" => array(
1628 "icon" => "downforeveryoneorjustme",
1629 "title" => "Down for everyone or just me",
1630 "rule" => array(
1631 "downforeveryoneorjustme" => ""
1632 ),
1633 "uri" => "http://www.downforeveryoneorjustme.com"
1634 ),
1635 "downloadninja" => array(
1636 "icon" => "robot",
1637 "title" => "Download Ninja",
1638 "rule" => array(
1639 "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1640 ),
1641 "uri" => ""
1642 ),
1643 "drupal" => array(
1644 "icon" => "drupal",
1645 "title" => "Drupal",
1646 "rule" => array(
1647 "^Drupal" => ""
1648 ),
1649 "uri" => ""
1650 ),
1651 "dsns" => array(
1652 "icon" => "robot",
1653 "title" => "DSNS Scanner",
1654 "rule" => array(
1655 "^DSNS" => ""
1656 ),
1657 "uri" => ""
1658 ),
1659 "dtsagent" => array(
1660 "icon" => "robot",
1661 "title" => "DTS Agent",
1662 "rule" => array(
1663 "DTS Agent" => ""
1664 ),
1665 "uri" => ""
1666 ),
1667 "duckduckgo" => array(
1668 "icon" => "duckduckgo",
1669 "title" => "DuckDuckGo",
1670 "rule" => array(
1671 "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1",
1672 "DuckDuckBot-Https[ /]([0-9.]{1,10})" => "\\1"
1673 ),
1674 "uri" => "http://duckduckgo.com"
1675 ),
1676 "earthcom" => array(
1677 "icon" => "earthcom",
1678 "title" => "Earthcom",
1679 "rule" => array(
1680 "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1681 ),
1682 "uri" => ""
1683 ),
1684 "ebay" => array(
1685 "icon" => "ebay",
1686 "title" => "eBay",
1687 "rule" => array(
1688 "eBay Relevance Ad Crawler" => ""
1689 ),
1690 "uri" => ""
1691 ),
1692 "echo" => array(
1693 "icon" => "robot",
1694 "title" => "Echo.com",
1695 "rule" => array(
1696 "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1697 ),
1698 "uri" => "http://www.echo.com/"
1699 ),
1700 "eert" => array(
1701 "icon" => "robot",
1702 "title" => "Eert",
1703 "rule" => array(
1704 "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1705 ),
1706 "uri" => "http://bot.eert.net"
1707 ),
1708 "eknip" => array(
1709 "icon" => "eknip",
1710 "title" => "E-Knip",
1711 "rule" => array(
1712 "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1713 ),
1714 "uri" => ""
1715 ),
1716 "zoominfo" => array(
1717 "icon" => "zoominfo",
1718 "title" => "ZoomInfo", // Previously called Eliyon
1719 "rule" => array(
1720 "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1721 ),
1722 "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1723 ),
1724 "emeraldshield" => array(
1725 "icon" => "emeraldshield",
1726 "title" => "EmeraldShield",
1727 "rule" => array(
1728 "^EmeraldShield" => ""
1729 ),
1730 "uri" => ""
1731 ),
1732 "empas" => array(
1733 "icon" => "empas",
1734 "title" => "Empas",
1735 "rule" => array(
1736 "DigExt; empas\)$" => "",
1737 "^EMPAS[_\-]ROBOT" => ""
1738 ),
1739 "uri" => ""
1740 ),
1741 "entfer" => array(
1742 "ilse" => array( // Ilse crawlers (INGRID, IlseRobot, IlseBot)
1743 "icon" => "ilse",
1744 "title" => "Ilse",
1745 "rule" => array(
1746 "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the name alternation; the version digits are group 2
1747 ),
1748 "uri" => "http://ilse.nl/"
1749 ),
1750 "icon" => "entireweb",
1751 "title" => "Entireweb",
1752 "rule" => array(
1753 "Speedy[ ]?Spider" => ""
1754 ),
1755 "uri" => ""
1756 ),
1757 "envolk" => array(
1758 "icon" => "envolk",
1759 "title" => "Envolk",
1760 "rule" => array(
1761 "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1762 "envolk[/ ]([0-9.]{1,10})" => "\\1"
1763 ),
1764 "uri" => ""
1765 ),
1766 "esnet" => array( // ES.NET crawler
1767 "icon" => "robot",
1768 "title" => "ES.NET",
1769 "rule" => array(
1770 "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped so it matches only a literal "."
1771 ),
1772 "uri" => ""
1773 ),
1774 "estyle" => array(
1775 "icon" => "estyle",
1776 "title" => "eStyle Search",
1777 "rule" => array(
1778 "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1779 ),
1780 "uri" => ""
1781 ),
1782 "eurip" => array(
1783 "icon" => "robot",
1784 "title" => "Eurip",
1785 "rule" => array(
1786 "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1787 ),
1788 "uri" => "http://www.eurip.com"
1789 ),
1790 "eurodirectory" => array(
1791 "icon" => "robot",
1792 "title" => "Euro Directory",
1793 "rule" => array(
1794 "www\.euro-directory\.com" => ""
1795 ),
1796 "uri" => "http://www.euro-directory.com/"
1797 ),
1798 "euroseek" => array(
1799 "icon" => "euroseek",
1800 "title" => "EuroSeek",
1801 "rule" => array(
1802 "Arachnoidea" => ""
1803 ),
1804 "uri" => ""
1805 ),
1806 "evaal" => array(
1807 "icon" => "evaal",
1808 "title" => "Evaal",
1809 "rule" => array(
1810 "^EvaalSE" => ""
1811 ),
1812 "uri" => "http://www.evaal.com/"
1813 ),
1814 "eventax" => array(
1815 "icon" => "eventax",
1816 "title" => "Eventax",
1817 "rule" => array(
1818 "^eventax[ /]([0-9.]{1,10})" => "\\1"
1819 ),
1820 "uri" => "http://www.eventax.de/"
1821 ),
1822 "everbee" => array(
1823 "icon" => "everbee",
1824 "title" => "Everbee",
1825 "rule" => array(
1826 "EverbeeCrawler" => ""
1827 ),
1828 "uri" => ""
1829 ),
1830 "everest" => array( // Everest-Vulcan crawler
1831 "icon" => "everest",
1832 "title" => "Everest",
1833 "rule" => array(
1834 "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // dot after "Inc" escaped so it matches literally
1835 ),
1836 "uri" => ""
1837 ),
1838 "exabot" => array(
1839 "icon" => "exabot",
1840 "title" => "ExaBot",
1841 "rule" => array(
1842 "^NG[ /]([0-9.]{1,10})" => "\\1",
1843 "Exabot/([0-9.]{1,10})" => "\\1",
1844 "ExaBotTest/([0-9.]{1,10})" => "\\1",
1845 "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1846 "ExaBot-Thumbnails" => ""
1847 ),
1848 "uri" => "http://www.exabot.com/go/robot"
1849 ),
1850 "exactseek" => array(
1851 "icon" => "exactseek",
1852 "title" => "ExactSeek",
1853 "rule" => array(
1854 "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1855 "ExactSeek[ \.\-]?(Crawler|com)" => ""
1856 ),
1857 "uri" => "http://www.exactseek.com/"
1858 ),
1859 "excite" => array(
1860 "icon" => "excite",
1861 "title" => "Excite",
1862 "rule" => array(
1863 "Architext[ \-]?Spider" => ""
1864 ),
1865 "uri" => ""
1866 ),
1867 "execrawl" => array(
1868 "icon" => "robot",
1869 "title" => "Execrawl",
1870 "rule" => array(
1871 "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1872 "Execrawl" => ""
1873 ),
1874 "uri" => ""
1875 ),
1876 "expertmonitor" => array(
1877 "icon" => "robot",
1878 "title" => "ExpertMonitor",
1879 "rule" => array(
1880 "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1881 ),
1882 "uri" => ""
1883 ),
1884 "explorerrss" => array(
1885 "icon" => "robot",
1886 "title" => "Explorer RSS",
1887 "rule" => array(
1888 "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1889 ),
1890 "uri" => ""
1891 ),
1892 "ezooms" => array(
1893 "icon" => "robot",
1894 "title" => "Ezooms",
1895 "rule" => array(
1896 "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1897 ),
1898 "uri" => ""
1899 ),
1900 "facebook" => array(
1901 "icon" => "facebook",
1902 "title" => "Facebook",
1903 "rule" => array(
1904 "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1905 "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1906 "^facebook" => ""
1907 ),
1908 "uri" => "http://www.facebook.com/"
1909 ),
1910 "fast" => array(
1911 "icon" => "fast",
1912 "title" => "Fast",
1913 "rule" => array(
1914 "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1915 "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1916 "^Fast Crawler" => "",
1917 "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1918 ),
1919 "uri" => "http://www.alltheweb.com/"
1920 ),
1921 "fastbuzz" => array(
1922 "icon" => "fastbuzz",
1923 "title" => "Fastbuzz",
1924 "rule" => array(
1925 "^fastbuzz\.com" => ""
1926 ),
1927 "uri" => ""
1928 ),
1929 "favorg" => array(
1930 "icon" => "robot",
1931 "title" => "FavOrg",
1932 "rule" => array(
1933 "^FavOrg" => ""
1934 ),
1935 "uri" => ""
1936 ),
1937 "favorstar" => array(
1938 "icon" => "favorstar",
1939 "title" => "Favorstar",
1940 "rule" => array(
1941 "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1942 ),
1943 "uri" => "http://favorstar.com/bot.html"
1944 ),
1945 "faxo" => array(
1946 "icon" => "robot",
1947 "title" => "Faxo",
1948 "rule" => array(
1949 "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1950 ),
1951 "uri" => "http://www.faxo.com/"
1952 ),
1953 "fdse" => array(
1954 "icon" => "robot",
1955 "title" => "FDSE Robot",
1956 "rule" => array(
1957 "FDSE[ \-]?robot" => ""
1958 ),
1959 "uri" => ""
1960 ),
1961 "feedback" => array(
1962 "icon" => "robot",
1963 "title" => "FeedBack",
1964 "rule" => array(
1965 "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1966 ),
1967 "uri" => ""
1968 ),
1969 "feedburner" => array(
1970 "icon" => "feedburner",
1971 "title" => "FeedBurner",
1972 "rule" => array(
1973 "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1974 ),
1975 "uri" => ""
1976 ),
1977 "feeddemon" => array(
1978 "icon" => "feeddemon",
1979 "title" => "FeedDemon",
1980 "rule" => array(
1981 "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1982 ),
1983 "uri" => ""
1984 ),
1985 "feedfind" => array(
1986 "icon" => "feedfind",
1987 "title" => "FeedFind",
1988 "rule" => array(
1989 "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1990 ),
1991 "uri" => ""
1992 ),
1993 "feedonfeeds" => array(
1994 "icon" => "robot",
1995 "title" => "Feed On Feeds",
1996 "rule" => array(
1997 "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1998 ),
1999 "uri" => ""
2000 ),
2001 "feedparser" => array(
2002 "icon" => "robot",
2003 "title" => "Feedparser",
2004 "rule" => array(
2005 "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
2006 "FeedParser" => ""
2007 ),
2008 "uri" => ""
2009 ),
2010 "feedreader" => array(
2011 "icon" => "feedreader",
2012 "title" => "Feedreader",
2013 "rule" => array(
2014 "^Feedreader" => ""
2015 ),
2016 "uri" => ""
2017 ),
2018 "feedserver" => array(
2019 "icon" => "robot",
2020 "title" => "FeedServer",
2021 "rule" => array(
2022 "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
2023 ),
2024 "uri" => ""
2025 ),
2026 "feedster" => array(
2027 "icon" => "feedster",
2028 "title" => "Feedster",
2029 "rule" => array(
2030 "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2031 ),
2032 "uri" => ""
2033 ),
2034 "feedvalidator" => array(
2035 "icon" => "feedvalidator",
2036 "title" => "Feed Validator",
2037 "rule" => array(
2038 "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2039 ),
2040 "uri" => ""
2041 ),
2042 "fdm" => array(
2043 "icon" => "robot",
2044 "title" => "Free Download Manager",
2045 "rule" => array(
2046 "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2047 ),
2048 "uri" => ""
2049 ),
2050 "filangy" => array(
2051 "icon" => "robot",
2052 "title" => "Filangy",
2053 "rule" => array(
2054 "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2055 ),
2056 "uri" => "http://www.filangy.com/"
2057 ),
2058 "findanisp" => array(
2059 "icon" => "robot",
2060 "title" => "FindAnISP",
2061 "rule" => array(
2062 "FindAnISP" => ""
2063 ),
2064 "uri" => "http://www.findanisp.com/"
2065 ),
2066 "findengines" => array(
2067 "icon" => "findengines",
2068 "title" => "FindEngines",
2069 "rule" => array(
2070 "FindEngines! Bot" => ""
2071 ),
2072 "uri" => ""
2073 ),
2074 "findexa" => array(
2075 "icon" => "findexa",
2076 "title" => "Findexa",
2077 "rule" => array(
2078 "Findexa Crawler" => ""
2079 ),
2080 "uri" => ""
2081 ),
2082 "findlinks" => array(
2083 "icon" => "findlinks",
2084 "title" => "FindLinks",
2085 "rule" => array(
2086 "findlinks[ /]([0-9.]{1,10})" => "\\1",
2087 "^FindLinks" => ""
2088 ),
2089 "uri" => ""
2090 ),
2091 "findoor" => array( // Findoor crawler ("findoor" or "findoor-Bot")
2092 "icon" => "findoor",
2093 "title" => "Findoor",
2094 "rule" => array(
2095 "^findoor(-Bot)?" => "" // the only group is the optional "-Bot" suffix, not a version, so no back-reference is used
2096 ),
2097 "uri" => ""
2098 ),
2099 "firefly" => array(
2100 "icon" => "firefly",
2101 "title" => "Firefly",
2102 "rule" => array(
2103 "Firefly" => ""
2104 ),
2105 "uri" => ""
2106 ),
2107 "flashget" => array(
2108 "icon" => "flashget",
2109 "title" => "FlashGet",
2110 "rule" => array(
2111 "^FlashGet" => ""
2112 ),
2113 "uri" => ""
2114 ),
2115 "flatland" => array(
2116 "icon" => "flatland",
2117 "title" => "Flatland",
2118 "rule" => array(
2119 "^flatlandbot" => ""
2120 ),
2121 "uri" => "http://www.flatlandindustries.com/flatlandbot"
2122 ),
2123 "flickbot" => array(
2124 "icon" => "flickbot",
2125 "title" => "FlickBot",
2126 "rule" => array(
2127 "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2128 ),
2129 "uri" => ""
2130 ),
2131 "flightdeckreports" => array(
2132 "icon" => "flightdeckreports",
2133 "title" => "Flight Deck Reports",
2134 "rule" => array(
2135 "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2136 ),
2137 "uri" => "http://www.flightdeckreports.com/"
2138 ),
2139 "forex" => array(
2140 "icon" => "robot",
2141 "title" => "Forex",
2142 "rule" => array(
2143 "^Forex Trading Network Organization" => ""
2144 ),
2145 "uri" => "http://www.netforex.org/"
2146 ),
2147 "freshmeat" => array( // Freshmeat URL validator (old "fmII" and newer "freshmeat.net" tokens)
2148 "icon" => "freshmeat",
2149 "title" => "Freshmeat",
2150 "rule" => array(
2151 "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2152 "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped so it matches only a literal "."
2153 ),
2154 "uri" => "http://www.freshmeat.net/"
2155 ),
2156 "friend" => array(
2157 "icon" => "friend",
2158 "title" => "Friend",
2159 "rule" => array(
2160 "www\.friend\.fr" => ""
2161 ),
2162 "uri" => "http://www.friend.fr/"
2163 ),
2164 "frontier" => array(
2165 "icon" => "frontier",
2166 "title" => "Frontier",
2167 "rule" => array(
2168 "Frontier[ /]([0-9.]{1,10})" => "\\1"
2169 ),
2170 "uri" => ""
2171 ),
2172 "fyberspider" => array(
2173 "icon" => "robot",
2174 "title" => "FyberSpider",
2175 "rule" => array(
2176 "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2177 ),
2178 "uri" => "http://www.fyberspider.com/"
2179 ),
2180 "gaisbot" => array(
2181 "icon" => "gais",
2182 "title" => "Gaisbot",
2183 "rule" => array(
2184 "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2185 ),
2186 "uri" => ""
2187 ),
2188 "galaxy" => array( // Galaxy crawler; matched by bot token or by the site host name
2189 "icon" => "galaxy",
2190 "title" => "Galaxy",
2191 "rule" => array(
2192 "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2193 "www\.galaxy\.com" => "" // dots escaped so they match literally instead of any character
2194 ),
2195 "uri" => "http://www.galaxy.com/"
2196 ),
2197 "gamespy" => array(
2198 "icon" => "gamespy",
2199 "title" => "GameSpy",
2200 "rule" => array(
2201 "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2202 ),
2203 "uri" => ""
2204 ),
2205 "garlik" => array(
2206 "icon" => "garlik",
2207 "title" => "Garlik",
2208 "rule" => array(
2209 "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2210 ),
2211 "uri" => "http://garlik.com/"
2212 ),
2213 "gdesktop" => array(
2214 "icon" => "gdesktop",
2215 "title" => "Google Desktop",
2216 "rule" => array(
2217 "compatible; Google Desktop" => ""
2218 ),
2219 "uri" => ""
2220 ),
2221 "genome" => array(
2222 "icon" => "robot",
2223 "title" => "Genome Machine",
2224 "rule" => array(
2225 "Genome[ \-]?Machine" => ""
2226 ),
2227 "uri" => ""
2228 ),
2229 "geohash" => array(
2230 "icon" => "geohash",
2231 "title" => "Geohash",
2232 "rule" => array(
2233 "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2234 ),
2235 "uri" => "http://geohash.org/"
2236 ),
2237 "geona" => array(
2238 "icon" => "robot",
2239 "title" => "Geona",
2240 "rule" => array(
2241 "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2242 ),
2243 "uri" => ""
2244 ),
2245 "geoblog" => array(
2246 "icon" => "robot",
2247 "title" => "The World as a Blog",
2248 "rule" => array(
2249 "The World as a Blog" => ""
2250 ),
2251 "uri" => ""
2252 ),
2253 "geourl" => array(
2254 "icon" => "geourl",
2255 "title" => "GeoUrl",
2256 "rule" => array(
2257 "geourl[ /]([0-9.]{1,10})" => "\\1",
2258 "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2259 ),
2260 "uri" => ""
2261 ),
2262 "getnetwise" => array(
2263 "icon" => "robot",
2264 "title" => "GetNetWise",
2265 "rule" => array(
2266 " Crayon Crawler" => ""
2267 ),
2268 "uri" => ""
2269 ),
2270 "getright" => array(
2271 "icon" => "getright",
2272 "title" => "GetRight",
2273 "rule" => array(
2274 "GetRight[ /]([0-9.]{1,10})" => "\\1"
2275 ),
2276 "uri" => ""
2277 ),
2278 "getsmart" => array(
2279 "icon" => "getsmart",
2280 "title" => "GetSmart",
2281 "rule" => array(
2282 "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2283 ),
2284 "uri" => ""
2285 ),
2286 "gigabot" => array(
2287 "icon" => "gigablast",
2288 "title" => "Gigablast",
2289 "rule" => array(
2290 "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2291 "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2292 "GigablastOpenSource" => ""
2293 ),
2294 "uri" => ""
2295 ),
2296 "gimme" => array(
2297 "icon" => "gimme",
2298 "title" => "gimmeUSA",
2299 "rule" => array(
2300 "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2301 ),
2302 "uri" => "http://gimme60.com"
2303 ),
2304 "ginger" => array(
2305 "icon" => "ginger",
2306 "title" => "GingerCrawler",
2307 "rule" => array(
2308 "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2309 ),
2310 "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2311 ),
2312 "girafabot" => array(
2313 "icon" => "girafa",
2314 "title" => "Girafa",
2315 "rule" => array(
2316 "Girafabot" => ""
2317 ),
2318 "uri" => ""
2319 ),
2320 "globalspec" => array(
2321 "icon" => "globalspec",
2322 "title" => "GlobalSpec",
2323 "rule" => array(
2324 "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2325 ),
2326 "uri" => ""
2327 ),
2328 "glucose" => array(
2329 "icon" => "glucose",
2330 "title" => "Glucose",
2331 "rule" => array(
2332 "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2333 ),
2334 "uri" => ""
2335 ),
2336 "gnomit" => array(
2337 "icon" => "gnomit",
2338 "title" => "Gnomit",
2339 "rule" => array(
2340 "gnomit[ /]([0-9.]{1,10})" => "\\1"
2341 ),
2342 "uri" => "http://www.gnomit.com/",
2343 ),
2344 "goforit" => array(
2345 "icon" => "goforit",
2346 "title" => "GoForIt",
2347 "rule" => array(
2348 "^GoForIt\.com" => "",
2349 "^GOFORITBOT" => ""
2350 ),
2351 "uri" => ""
2352 ),
2353 "goguides" => array(
2354 "icon" => "robot",
2355 "title" => "GoGuides",
2356 "rule" => array(
2357 "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2358 ),
2359 "uri" => "http://www.goguides.org/"
2360 ),
2361 // Needs to be before google for correct detection
2362 "mediapartners" => array(
2363 "icon" => "google",
2364 "title" => "Mediapartners",
2365 "rule" => array (
2366 "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2367 "Mediapartners-Google" => ""
2368 ),
2369 "uri" => ""
2370 ),
2371 "google" => array(
2372 "icon" => "google",
2373 "title" => "Google",
2374 "rule" => array (
2375 "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2376 "Googl(e|ebot)(-Image)?/" => "",
2377 "^gsa-crawler" => "",
2378 "Google Web Preview" => ""
2379 ),
2380 "uri" => "http://www.google.com/"
2381 ),
2382 "googlesitemaps" => array(
2383 "icon" => "google",
2384 "title" => "Google-Sitemaps",
2385 "rule" => array (
2386 "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2387 "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2388 "Googl(e|ebot)(-Sitemaps)?/" => ""
2389 ),
2390 "uri" => ""
2391 ),
2392 "googlemobile" => array(
2393 "icon" => "google",
2394 "title" => "Google-Mobile",
2395 "rule" => array (
2396 "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2397 "Googl(e|ebot)(-Mobile)?/" => ""
2398 ),
2399 "uri" => ""
2400 ),
2401 "googleads" => array(
2402 "icon" => "google",
2403 "title" => "Google-AdsBot",
2404 "rule" => array (
2405 "^AdsBot-Google" => "",
2406 ),
2407 "uri" => ""
2408 ),
2409 "googlefeeds" => array(
2410 "icon" => "google",
2411 "title" => "Google-Feedfetcher",
2412 "rule" => array (
2413 "^Feedfetcher-Google" => "",
2414 ),
2415 "uri" => ""
2416 ),
2417 "googlverification" => array(
2418 "icon" => "google",
2419 "title" => "Google-Site-Verification",
2420 "rule" => array (
2421 "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2422 ),
2423 "uri" => ""
2424 ),
2425 // Needs to be AFTER Google detection
2426 "goo" => array(
2427 "icon" => "goo",
2428 "title" => "Goo",
2429 "rule" => array (
2430 "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2431 "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2432 ),
2433 "uri" => ""
2434 ),
2435 "goongee" => array(
2436 "icon" => "robot",
2437 "title" => "GoonGee",
2438 "rule" => array (
2439 "^Big Fish[ /]v?([0-9.]{1,10})" => "\\2"
2440 ),
2441 "uri" => "http://www.goongee.com/"
2442 ),
2443 "gpost" => array(
2444 "icon" => "gpost",
2445 "title" => "GPost",
2446 "rule" => array(
2447 "^GPostbot" => ""
2448 ),
2449 "uri" => ""
2450 ),
2451 "grapeshot" => array(
2452 "icon" => "grapeshot",
2453 "title" => "Grapeshot",
2454 "rule" => array(
2455 "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2456 ),
2457 "uri" => "http://www.grapeshot.co.uk/crawler.php"
2458 ),
2459 "gregarius" => array( // Gregarius feed aggregator
2460 "icon" => "robot",
2461 "title" => "Gregarius",
2462 "rule" => array(
2463 "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // use the captured version, as sibling entries with the same pattern shape do
2464 ),
2465 "uri" => ""
2466 ),
2467 "grub" => array(
2468 "icon" => "grub",
2469 "title" => "Grub",
2470 "rule" => array(
2471 "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2472 "grub crawler" => "",
2473 "grub[/ ]([0-9.]{1,10})" => "\\1",
2474 "^GrubNG([0-9. ]{1,10})?" => "\\1"
2475 ),
2476 "uri" => "http://www.grub.org/"
2477 ),
2478 "gulliver" => array(
2479 "icon" => "robot",
2480 "title" => "Gulliver",
2481 "rule" => array(
2482 "Gulliver" => ""
2483 ),
2484 "uri" => ""
2485 ),
2486 "guruji" => array(
2487 "icon" => "guruji",
2488 "title" => "Guruji",
2489 "rule" => array(
2490 "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2491 ),
2492 "uri" => "http://www.guruji.com/"
2493 ),
2494 "gush" => array(
2495 "icon" => "robot",
2496 "title" => "Gush",
2497 "rule" => array(
2498 "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2499 ),
2500 "uri" => ""
2501 ),
2502 "gziptester" => array(
2503 "icon" => "robot",
2504 "title" => "Gzip Tester",
2505 "rule" => array(
2506 "HTTP_Compression_Test" => "",
2507 "g(id)?zip[ \-]?test(er)?" => ""
2508 ),
2509 "uri" => "http://whatsmyip.org/"
2510 ),
2511 "hanzoweb" => array(
2512 "icon" => "hanzoweb",
2513 "title" => "Hanzoweb",
2514 "rule" => array(
2515 "^Hanzoweb" => ""
2516 ),
2517 "uri" => ""
2518 ),
2519 "harbot" => array(
2520 "icon" => "harbot",
2521 "title" => "Harbot",
2522 "rule" => array(
2523 "^Harbot GateStation" => ""
2524 ),
2525 "uri" => ""
2526 ),
2527 "hatena" => array(
2528 "icon" => "hatena",
2529 "title" => "Hatena",
2530 "rule" => array(
2531 "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2532 ),
2533 "uri" => ""
2534 ),
2535 "htmlparser" => array(
2536 "icon" => "htmlparser",
2537 "title" => "HTMLParser",
2538 "rule" => array(
2539 "HTMLParser[ /]([0-9.]{1,10})" => "\\1",
2540 "lua-resty-http/0.10" => ""
2541 ),
2542 "uri" => "http://htmlparser.sourceforge.net/"
2543 ),
2544 "helix" => array( // Helix crawler; a separate entry from "heritrix", which follows it
2545 "icon" => "helix",
2546 "title" => "Helix", // was "Heritrix", apparently copied from the next entry; key, icon, rule and uri all say helix
2547 "rule" => array(
2548 "^helix[ /]([0-9.]{1,10})" => "\\1"
2549 ),
2550 "uri" => "http://www.sitesearch.ca/helix/"
2551 ),
2552 "heritrix" => array( // Heritrix / Internet Archive crawlers
2553 "icon" => "heritrix",
2554 "title" => "Heritrix",
2555 "rule" => array(
2556 "heritrix[ /]([0-9.]{1,10})" => "\\1",
2557 "archive\.org_bot" => "", // dot escaped so it matches only a literal "."
2558 "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2559 ),
2560 "uri" => "http://archive.org"
2561 ),
2562 "hiddenmarket" => array(
2563 "icon" => "robot",
2564 "title" => "HiddenMarket",
2565 "rule" => array(
2566 "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2567 ),
2568 "uri" => ""
2569 ),
2570 "honda" => array(
2571 "icon" => "robot",
2572 "title" => "Honda",
2573 "rule" => array(
2574 "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2575 ),
2576 "uri" => "http://www.honda-search.com"
2577 ),
2578 "hoowwwer" => array(
2579 "icon" => "hoowwwer",
2580 "title" => "HooWWWer",
2581 "rule" => array(
2582 "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2583 ),
2584 "uri" => ""
2585 ),
2586 "hotzonu" => array(
2587 "icon" => "hotzonu",
2588 "title" => "Hotzonu",
2589 "rule" => array(
2590 "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2591 ),
2592 "uri" => ""
2593 ),
2594 "houxou" => array(
2595 "icon" => "robot",
2596 "title" => "Houxou",
2597 "rule" => array(
2598 "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2599 "HouxouCrawler" => ""
2600 ),
2601 "uri" => ""
2602 ),
2603 "htdig" => array( // ht://Dig indexer; versioned rule first, bare-name fallback second
2604 "icon" => "htdig",
2605 "title" => "ht://Dig",
2606 "rule" => array(
2607 "htdig[ /]([0-9.]{1,10})" => "\\1",
2608 "htdig" => "" // fallback pattern has no capture group, so there is nothing for \1 to reference
2609 ),
2610 "uri" => ""
2611 ),
2612 "html2jpg" => array(
2613 "icon" => "html2jpg",
2614 "title" => "HTML2JPG",
2615 "rule" => array(
2616 "^HTML2JPG" => ""
2617 ),
2618 "uri" => ""
2619 ),
2620 "httperf" => array(
2621 "icon" => "robot",
2622 "title" => "HTTPerf",
2623 "rule" => array(
2624 "httperf[ /]([0-9.]{1,10})" => "\\1"
2625 ),
2626 "uri" => ""
2627 ),
2628 "httpunit" => array(
2629 "icon" => "httpunit",
2630 "title" => "HttpUnit",
2631 "rule" => array(
2632 "httpunit[ /]([0-9.]{1,10})" => "\\1"
2633 ),
2634 "uri" => ""
2635 ),
2636 "httrack" => array(
2637 "icon" => "httrack",
2638 "title" => "HTTrack",
2639 "rule" => array(
2640 "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2641 ),
2642 "uri" => ""
2643 ),
2644 "huaweisymantec" => array(
2645 "icon" => "huaweisymantec",
2646 "title" => "HuaweiSymantec",
2647 "rule" => array(
2648 "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2649 ),
2650 "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2651 ),
2652 "hungary" => array(
2653 "icon" => "hungary",
2654 "title" => "Hungary",
2655 "rule" => array(
2656 "HuRob[ /]([0-9.]{1,10})" => "\\1"
2657 ),
2658 "uri" => ""
2659 ),
2660 "i18n" => array(
2661 "icon" => "w3c",
2662 "title" => "W3C I18n Checker",
2663 "rule" => array(
2664 "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2665 ),
2666 "uri" => "http://validator.w3.org/services"
2667 ),
2668 "iakke" => array(
2669 "icon" => "iakke",
2670 "title" => "Iakké",
2671 "rule" => array(
2672 "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2673 ),
2674 "uri" => "http://fr.iakke.com/"
2675 ),
2676 "iask" => array(
2677 "icon" => "iask",
2678 "title" => "IAsk",
2679 "rule" => array(
2680 "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2681 "^iaskspider" => ""
2682 ),
2683 "uri" => "http://iask.com"
2684 ),
2685 "icc" => array(
2686 "icon" => "icc",
2687 "title" => "ICC-Crawler",
2688 "rule" => array(
2689 "^ICC-Crawler" => ""
2690 ),
2691 "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2692 ),
2693 "icerocket" => array(
2694 "icon" => "icerocket",
2695 "title" => "Icerocket",
2696 "rule" => array(
2697 "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2698 "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2699 ),
2700 "uri" => ""
2701 ),
2702 "icjobs" => array(
2703 "icon" => "icjobs",
2704 "title" => "iCjobs",
2705 "rule" => array(
2706 "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2707 ),
2708 "uri" => "http://www.icjobs.de/"
2709 ),
2710 "icra" => array(
2711 "icon" => "icra",
2712 "title" => "ICRA",
2713 "rule" => array(
2714 "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2715 ),
2716 "uri" => "http://www.icra.org"
2717 ),
2718 "iknow" => array(
2719 "icon" => "robot",
2720 "title" => "I know",
2721 "rule" => array(
2722 "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2723 ),
2724 "uri" => ""
2725 ),
2726 "ilial" => array(
2727 "icon" => "robot",
2728 "title" => "Ilial",
2729 "rule" => array(
2730 "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2731 ),
2732 "uri" => ""
2733 ),
2734 "ilocal" => array(
2735 "icon" => "ilocal",
2736 "title" => "ilocal",
2737 "rule" => array(
2738 "^ilocal" => "",
2739 ),
2740 "uri" => "http://www.ilocal.nl"
2741 ),
2742 "ilse" => array(
2743 "icon" => "ilse",
2744 "title" => "Ilse",
2745 "rule" => array(
2746 "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\1"
2747 ),
2748 "uri" => "http://ilse.nl/"
2749 ),
2750 "iltrovatore" => array(
2751 "icon" => "iltrovatore",
2752 "title" => "IlTrovatore",
2753 "rule" => array(
2754 "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2755 "Iltrovatore-Setaccio" => "",
2756 "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2757 ),
2758 "uri" => ""
2759 ),
2760 "indylibrary" => array(
2761 "icon" => "robot",
2762 "title" => "Indy Library",
2763 "rule" => array(
2764 "Indy[ \-]?Library" => ""
2765 ),
2766 "uri" => ""
2767 ),
// Inela crawler (InelaBot).
"inela" => array(
    "icon" => "robot",
    "title" => "Inela",
    "rule" => array(
        // The pattern captures the version number, so the replacement refers to
        // it with "\\1" like the other versioned rules in this table; an empty
        // replacement would throw the captured version away.
        "InelaBot[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => "http://inelegant.org/bot"
),
// InetURL client.
"ineturl" => array(
    "icon" => "robot",
    "title" => "InetURL",
    "rule" => array(
        // The pattern captures the version number, so the replacement refers to
        // it with "\\1" like the other versioned rules in this table; an empty
        // replacement would throw the captured version away.
        "InetURL.?[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
2784 "infoart" => array(
2785 "icon" => "robot",
2786 "title" => "InfoArt",
2787 "rule" => array(
2788 "InfoArt crawler" => ""
2789 ),
2790 "uri" => ""
2791 ),
2792 "infomine" => array(
2793 "icon" => "infomine",
2794 "title" => "INFOMINE",
2795 "rule" => array(
2796 "^DataFountains/DMOZ" => "",
2797 "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2798 ),
2799 "uri" => "http://infomine.ucr.edu/"
2800 ),
2801 "infoseek" => array(
2802 "icon" => "infoseek",
2803 "title" => "Infoseek",
2804 "rule" => array(
2805 "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2806 "Infoseek" => ""
2807 ),
2808 "uri" => ""
2809 ),
2810 "inktomi" => array(
2811 "icon" => "inktomi",
2812 "title" => "Inktomi",
2813 "rule" => array(
2814 "slurp@inktomi\.com" => ""
2815 ),
2816 "uri" => ""
2817 ),
2818 "innerprise" => array(
2819 "icon" => "robot",
2820 "title" => "Innerprise",
2821 "rule" => array(
2822 "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2823 "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2824 "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2825 ),
2826 "uri" => "http://www.innerprise.com/"
2827 ),
2828 "inria" => array(
2829 "icon" => "inria",
2830 "title" => "Inria",
2831 "rule" => array(
2832 "^xyro_" => ""
2833 ),
2834 "uri" => ""
2835 ),
2836 "insitor" => array(
2837 "icon" => "insitor",
2838 "title" => "Insitor",
2839 "rule" => array(
2840 "^Insitor(,|\.|naut)" => ""
2841 ),
2842 "uri" => "http://www.insitor.com/"
2843 ),
2844 "internetninja" => array(
2845 "icon" => "robot",
2846 "title" => "Internet Ninja",
2847 "rule" => array(
2848 "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2849 ),
2850 "uri" => ""
2851 ),
2852 "internetseer" => array(
2853 "icon" => "internetseer",
2854 "title" => "InternetSeer",
2855 "rule" => array(
2856 "^InternetSeer\.com" => ""
2857 ),
2858 "uri" => ""
2859 ),
2860 "interseek" => array(
2861 "icon" => "interseek",
2862 "title" => "Interseek",
2863 "rule" => array(
2864 "Interseek.com" => ""
2865 ),
2866 "uri" => "http://www.interseek.com"
2867 ),
2868 "intravnews" => array(
2869 "icon" => "intravnews",
2870 "title" => "IntraVnews",
2871 "rule" => array(
2872 "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2873 ),
2874 "uri" => "http://www.intravnews.com/"
2875 ),
2876 "ionos" => array(
2877 "icon" => "ionos",
2878 "title" => "IONOS",
2879 "rule" => array(
2880 "IonCrawl" => ""
2881 ),
2882 "uri" => "https://www.ionos.de/terms-gtc/faq-crawler-en/"
2883 ),
2884 "ip2location" => array(
2885 "icon" => "ip2location",
2886 "title" => "IP2LocationBot",
2887 "rule" => array(
2888 "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2889 ),
2890 "uri" => "http://www.ip2location.com"
2891 ),
2892 "ipworks" => array(
2893 "icon" => "ipworks",
2894 "title" => "IP*Works",
2895 "rule" => array(
2896 "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2897 ),
2898 "uri" => "http://www.nsoftware.com/ipworks/"
2899 ),
2900 "irca" => array(
2901 "icon" => "robot",
2902 "title" => "Novell iChain Cool Solutions caching",
2903 "rule" => array(
2904 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2905 "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2906 ),
2907 "uri" => "http://www.icra.org"
2908 ),
2909 "irvine" => array(
2910 "icon" => "robot",
2911 "title" => "Irvine",
2912 "rule" => array(
2913 "Irvine[ /]([0-9.]{1,10})" => "\\1"
2914 ),
2915 "uri" => ""
2916 ),
2917 "ips-agent" => array(
2918 "icon" => "robot",
2919 "title" => "IPS-agent",
2920 "rule" => array(
2921 "ips-agent" => ""
2922 ),
2923 "uri" => ""
2924 ),
2925 "isara" => array(
2926 "icon" => "isara",
2927 "title" => "Isara",
2928 "rule" => array(
2929 "Isara[ -]([0-9.]{1,10})" => "\\1"
2930 ),
2931 "uri" => "http://www.isara.org/"
2932 ),
2933 "isspider" => array(
2934 "icon" => "robot",
2935 "title" => "ISSpider",
2936 "rule" => array(
2937 "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2938 ),
2939 "uri" => ""
2940 ),
2941 "it2media" => array(
2942 "icon" => "it2media",
2943 "title" => "IT2media",
2944 "rule" => array(
2945 "www.adressendeutschland.de" => ""
2946 ),
2947 "uri" => "http://www.adressendeutschland.de/"
2948 ),
2949 "ivia" => array(
2950 "icon" => "robot",
2951 "title" => "iVia",
2952 "rule" => array(
2953 "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2954 ),
2955 "uri" => ""
2956 ),
2957 "jeteye" => array(
2958 "icon" => "jeteye",
2959 "title" => "Jeteye",
2960 "rule" => array(
2961 "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2962 ),
2963 "uri" => ""
2964 ),
2965 "jobsde" => array(
2966 "icon" => "jobsde",
2967 "title" => "jobs.de",
2968 "rule" => array(
2969 "www\.jobs\.de" => "",
2970 "jobs.de-Robot" => ""
2971 ),
2972 "uri" => "http://www.jobs.de/"
2973 ),
2974 "jpluck" => array(
2975 "icon" => "robot",
2976 "title" => "Jpluck",
2977 "rule" => array(
2978 "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2979 ),
2980 "uri" => ""
2981 ),
2982 "jxta" => array(
2983 "icon" => "robot",
2984 "title" => "Jxta",
2985 "rule" => array(
2986 "falcon[ /]([0-9.]{1,10})" => "\\1"
2987 ),
2988 "uri" => ""
2989 ),
2990 "jyte" => array(
2991 "icon" => "jyte",
2992 "title" => "Jyte",
2993 "rule" => array(
2994 "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2995 ),
2996 "uri" => ""
2997 ),
2998 "jyxo" => array(
2999 "icon" => "jyxo",
3000 "title" => "Jyxo",
3001 "rule" => array(
3002 "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
3003 ),
3004 "uri" => ""
3005 ),
3006 "kalooga" => array(
3007 "icon" => "kalooga",
3008 "title" => "Kalooga",
3009 "rule" => array(
3010 "kalooga[ /-]([0-9.]{1,10})" => "\\1",
3011 "^kalooga" => "",
3012 "KaloogaBot" => ""
3013 ),
3014 "uri" => "http://www.kalooga.com"
3015 ),
3016 "keywen" => array(
3017 "icon" => "keywen",
3018 "title" => "Keywen",
3019 "rule" => array(
3020 "EasyDL[ /]([0-9.]{1,10})" => "\\1"
3021 ),
3022 "uri" => ""
3023 ),
3024 "kilomonkey" => array(
3025 "icon" => "robot",
3026 "title" => "Kilomonkey",
3027 "rule" => array(
3028 "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
3029 ),
3030 "uri" => "http://www.kilomonkey.com/notabot.txt"
3031 ),
3032 "kinja" => array(
3033 "icon" => "kinja",
3034 "title" => "Kinja",
3035 "rule" => array(
3036 "kinjabot[ /]([0-9.]{1,10})" => "\\1",
3037 "^kinjabot" => ""
3038 ),
3039 "uri" => ""
3040 ),
3041 "kiwi" => array(
3042 "icon" => "robot",
3043 "title" => "KiwiStatus",
3044 "rule" => array(
3045 "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3046 "KiwiStatus" => ""
3047 ),
3048 "uri" => "http://www.nzs.com/kiei-status/"
3049 ),
3050 "lachesis" => array(
3051 "icon" => "robot",
3052 "title" => "Lachesis",
3053 "rule" => array(
3054 "lachesis" => ""
3055 ),
3056 "uri" => ""
3057 ),
// Lanshan crawler (lanshanbot). The title names this bot itself so that it is
// not reported under the label of the unrelated "lachesis" entry.
"lanshan" => array(
    "icon" => "robot",
    "title" => "Lanshan",
    "rule" => array(
        "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
3066 "lapozz" => array(
3067 "icon" => "lapozz",
3068 "title" => "Lapozz",
3069 "rule" => array(
3070 "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3071 ),
3072 "uri" => ""
3073 ),
3074 "larbin" => array(
3075 "icon" => "robot",
3076 "title" => "Larbin",
3077 "rule" => array(
3078 "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3079 ),
3080 "uri" => ""
3081 ),
3082 "laurion" => array(
3083 "icon" => "robot",
3084 "title" => "Laurion",
3085 "rule" => array(
3086 "^IPiumBot" => ""
3087 ),
3088 "uri" => "http://www.laurion.com/"
3089 ),
3090 "leechget" => array(
3091 "icon" => "leechget",
3092 "title" => "LeechGet",
3093 "rule" => array(
3094 "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3095 ),
3096 "uri" => ""
3097 ),
3098 "linguaseek" => array(
3099 "icon" => "linguaseek",
3100 "title" => "Linguaseek",
3101 "rule" => array(
3102 "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3103 ),
3104 "uri" => "http://www.linguaseek.com/"
3105 ),
3106 "linguee" => array(
3107 "icon" => "linguee",
3108 "title" => "Linguee",
3109 "rule" => array(
3110 "^Linguee Bot" => ""
3111 ),
3112 "uri" => "http://www.linguee.com/"
3113 ),
3114 "linkapedia" => array(
3115 "icon" => "linkapedia",
3116 "title" => "Linkapedia",
3117 "rule" => array(
3118 "^linkapedia" => ""
3119 ),
3120 "uri" => "http://www.linkapedia.com"
3121 ),
3122 "linkdex" => array(
3123 "icon" => "linkdex",
3124 "title" => "Linkdex",
3125 "rule" => array(
3126 "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3127 ),
3128 "uri" => "http://www.linkdex.com/bots/"
3129 ),
3130 "linkedin" => array(
3131 "icon" => "linkedin",
3132 "title" => "LinkedIn",
3133 "rule" => array(
3134 "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3135 ),
3136 "uri" => "http://www.linkedin.com"
3137 ),
3138 "linkguard" => array(
3139 "icon" => "robot",
3140 "title" => "Linkguard",
3141 "rule" => array(
3142 "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3143 ),
3144 "uri" => "http://www.linkguard.com/"
3145 ),
3146 "linklint" => array(
3147 "icon" => "linklint",
3148 "title" => "Linklint",
3149 "rule" => array(
3150 "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3151 ),
3152 "uri" => "http://www.linklint.org/"
3153 ),
3154 "linkman" => array(
3155 "icon" => "linkman",
3156 "title" => "Linkman",
3157 "rule" => array(
3158 "\(compatible; Linkman\)" => ""
3159 ),
3160 "uri" => ""
3161 ),
3162 // Needs to be before linkcheck for correct detection
3163 "linkchecker" => array(
3164 "icon" => "w3c",
3165 "title" => "W3C Link Checker",
3166 "rule" => array(
3167 "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3168 ),
3169 "uri" => "http://validator.w3.org/checklink"
3170 ),
3171 "linkcheck" => array(
3172 "icon" => "linkcheck",
3173 "title" => "Linkcheck",
3174 "rule" => array(
3175 "checklink[ /]([0-9.]{1,10})" => "\\1",
3176 "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3177 "Adaxas Spider" => "",
3178 "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3179 // "NetMechanic V([0-9.]{1,10})" => "\\1",
3180 "^InfoLink" => "",
3181 "InternetLinkAgent" => "",
3182 "; SPENG\)" => "",
3183 "SharewarePlazaFileCheckBot" => "",
3184 "fileboost.net" => "",
3185 "^billbot" => ""
3186 ),
3187 "uri" => ""
3188 ),
3189 "linkru" => array(
3190 "icon" => "robot",
3191 "title" => "Link.RU",
3192 "rule" => array(
3193 "^Link.RU bot" => ""
3194 ),
3195 "uri" => ""
3196 ),
3197 "linkssql" => array(
3198 "icon" => "robot",
3199 "title" => "Links SQL",
3200 "rule" => array(
3201 "links sql" => ""
3202 ),
3203 "uri" => ""
3204 ),
3205 "linksweeper" => array(
3206 "icon" => "robot",
3207 "title" => "Link Sweeper",
3208 "rule" => array(
3209 "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3210 ),
3211 "uri" => ""
3212 ),
3213 "linkwalker" => array(
3214 "icon" => "robot",
3215 "title" => "Link Walker",
3216 "rule" => array(
3217 "^LinkWalker" => ""
3218 ),
3219 "uri" => ""
3220 ),
3221 "lipperhey" => array(
3222 "icon" => "lipperhey",
3223 "title" => "Lipperhey",
3224 "rule" => array(
3225 "Lipperhey Spider" => ""
3226 ),
3227 "uri" => "http://www.lipperhey.com"
3228 ),
3229 "livedoor" => array(
3230 "icon" => "livedoor",
3231 "title" => "Livedoor",
3232 "rule" => array(
3233 "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3234 ),
3235 "uri" => ""
3236 ),
3237 "livejournal" => array(
3238 "icon" => "livejournal",
3239 "title" => "Live Journal",
3240 "rule" => array(
3241 "^LiveJournal\.com" => ""
3242 ),
3243 "uri" => "http://www.livejournal.com"
3244 ),
3245 "ljpic" => array(
3246 "icon" => "ljpic",
3247 "title" => "ljpic",
3248 "rule" => array(
3249 "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3250 ),
3251 "uri" => "http://www.ljpic.com"
3252 ),
3253 "lmspider" => array(
3254 "icon" => "robot",
3255 "title" => "Lmspider",
3256 "rule" => array(
3257 "^lmspider" => ""
3258 ),
3259 "uri" => ""
3260 ),
3261 "locators" => array(
3262 "icon" => "robot",
3263 "title" => "Locaters",
3264 "rule" => array(
3265 "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3266 ),
3267 "uri" => ""
3268 ),
3269 "look" => array(
3270 "icon" => "look",
3271 "title" => "Look",
3272 "rule" => array(
3273 "www\.look\.com" => "",
3274 "Lookbot" => ""
3275 ),
3276 "uri" => ""
3277 ),
3278 "looksmart" => array(
3279 "icon" => "looksmart",
3280 "title" => "LookSmart",
3281 "rule" => array(
3282 "^Martini" => "",
3283 "^MantraAgent" => "",
3284 "FurlBot" => "",
3285 "looksmart-sv-fw" => ""
3286 ),
3287 "uri" => ""
3288 ),
3289 "loop" => array(
3290 "icon" => "loop",
3291 "title" => "LOOP",
3292 "rule" => array(
3293 "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3294 ),
3295 "uri" => ""
3296 ),
3297 "lotkyll" => array(
3298 "icon" => "robot",
3299 "title" => "Lotkyll",
3300 "rule" => array(
3301 "Lotkyll" => ""
3302 ),
3303 "uri" => ""
3304 ),
3305 "ltx71" => array(
3306 "icon" => "robot",
3307 "title" => "LTX71",
3308 "rule" => array(
3309 "ltx71" => ""
3310 ),
3311 "uri" => "http://ltx71.com/"
3312 ),
3313 "lwp" => array(
3314 "icon" => "robot",
3315 "title" => "lwp",
3316 "rule" => array(
3317 "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3318 ),
3319 "uri" => ""
3320 ),
3321 "lycos" => array(
3322 "icon" => "lycos",
3323 "title" => "Lycos",
3324 "rule" => array(
3325 "Lycos_Spider_" => ""
3326 ),
3327 "uri" => ""
3328 ),
3329 "magpierss" => array(
3330 "icon" => "rss",
3331 "title" => "MagpieRSS",
3332 "rule" => array(
3333 "MagpieRSS" => ""
3334 ),
3335 "uri" => "http://magpierss.sourceforge.net/"
3336 ),
3337 "mailru" => array(
3338 "icon" => "mailru",
3339 "title" => "Mail.Ru",
3340 "rule" => array(
3341 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3342 "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3343 ),
3344 "uri" => "http://www.mail.ru/"
3345 ),
3346 "mailsweeper" => array(
3347 "icon" => "robot",
3348 "title" => "Mail Sweeper",
3349 "rule" => array(
3350 "Mail[ \-]?Sweeper" => ""
3351 ),
3352 "uri" => ""
3353 ),
3354 "marvin" => array(
3355 "icon" => "robot",
3356 "title" => "Marvin",
3357 "rule" => array(
3358 "^Marvin" => ""
3359 ),
3360 "uri" => ""
3361 ),
3362 "matkurja" => array(
3363 "icon" => "matkurja",
3364 "title" => "Mat'Kurja",
3365 "rule" => array(
3366 "Mosad[ /]([0-9.]{1,10})" => "\\1"
3367 ),
3368 "uri" => ""
3369 ),
3370 "mavicanet" => array(
3371 "icon" => "mavicanet",
3372 "title" => "Mavicanet",
3373 "rule" => array(
3374 "Mavicanet robot" => ""
3375 ),
3376 "uri" => ""
3377 ),
3378 "meanpath" => array(
3379 "icon" => "meanpath",
3380 "title" => "Meanpath",
3381 "rule" => array(
3382 "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3383 ),
3384 "uri" => "http://www.meanpath.com/meanpathbot.html"
3385 ),
3386 "mediater" => array(
3387 "icon" => "robot",
3388 "title" => "Mediater",
3389 "rule" => array (
3390 "^libwww[ /]([0-9.]{1,10})" => "\\1"
3391 ),
3392 "uri" => ""
3393 ),
3394 "memory" => array(
3395 "icon" => "memory",
3396 "title" => "internet Memory",
3397 "rule" => array (
3398 "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3399 ),
3400 "uri" => "http://internetmemory.org/en/"
3401 ),
3402 "mercator" => array(
3403 "icon" => "robot",
3404 "title" => "Mercator",
3405 "rule" => array(
3406 "Mercator" => ""
3407 ),
3408 "uri" => ""
3409 ),
// Metacarta crawlers, identified by their contact addresses or the "flunky" name.
"metacarta" => array(
    "icon" => "robot",
    "title" => "Metacarta",
    "rule" => array(
        // Parentheses and dots are escaped so the literal text
        // "RRC (crawler_admin@bigfoot.com)" is matched; unescaped parentheses
        // would open a capture group and never match the real "(" and ")".
        "^RRC \(crawler_admin@bigfoot\.com\)" => "",
        "^flunky" => "",
        "^Mozilla.*\(samualt9@bigfoot\.com\)$" => ""
    ),
    "uri" => "http://www.metacarta.com"
),
3420 "metager" => array(
3421 "icon" => "metager",
3422 "title" => "MetaGer",
3423 "rule" => array(
3424 "MetaGer" => ""
3425 ),
3426 "uri" => ""
3427 ),
3428 "metamark" => array(
3429 "icon" => "robot",
3430 "title" => "Metamark",
3431 "rule" => array(
3432 "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3433 ),
3434 "uri" => "http://metamark.net"
3435 ),
3436 "metamedic" => array(
3437 "icon" => "metamedic",
3438 "title" => "MetaMedic",
3439 "rule" => array(
3440 "MediBot[ /]([0-9.]{1,10})" => "\\1"
3441 ),
3442 "uri" => ""
3443 ),
3444 "mirago" => array(
3445 "icon" => "mirago",
3446 "title" => "Mirago",
3447 "rule" => array(
3448 "Mirago" => ""
3449 ),
3450 "uri" => ""
3451 ),
3452 "misterwong" => array(
3453 "icon" => "misterwong",
3454 "title" => "Mister Wong",
3455 "rule" => array(
3456 "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3457 ),
3458 "uri" => "http://www.mister-wong.de/"
3459 ),
3460 "miva" => array(
3461 "icon" => "miva",
3462 "title" => "Miva",
3463 "rule" => array(
3464 "AlgoFeedback@miva\.com" => ""
3465 ),
3466 "uri" => "http://www.miva.com/"
3467 ),
3468 "mj12" => array(
3469 "icon" => "mj12",
3470 "title" => "Majestic-12",
3471 "rule" => array(
3472 "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3473 "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3474 ),
3475 "uri" => "http://majestic12.co.uk/bot.php"
3476 ),
3477 "mlbot" => array(
3478 "icon" => "robot",
3479 "title" => "MLBot",
3480 "rule" => array(
3481 "^MLBot" => ""
3482 ),
3483 "uri" => "http://www.metadatalabs.com/mlbot"
3484 ),
3485 "mnogo" => array(
3486 "icon" => "mnogo",
3487 "title" => "mnoGoSearch",
3488 "rule" => array(
3489 "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3490 ),
3491 "uri" => "http://www.mnogosearch.org/"
3492 ),
3493 "mobileok" => array(
3494 "icon" => "mobileok",
3495 "title" => "W3C mobileOK",
3496 "rule" => array(
3497 "^W3C-mobileOK" => ""
3498 ),
3499 "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3500 ),
3501 "mojeek" => array(
3502 "icon" => "mojeek",
3503 "title" => "Mojeek",
3504 "rule" => array(
3505 "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3506 ),
3507 "uri" => "https://www.mojeek.com/bot.html"
3508 ),
3509 "momspider" => array(
3510 "icon" => "robot",
3511 "title" => "MOM Spider",
3512 "rule" => array(
3513 "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3514 ),
3515 "uri" => ""
3516 ),
3517 "moreover" => array(
3518 "icon" => "moreover",
3519 "title" => "Moreover",
3520 "rule" => array(
3521 "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3522 ),
3523 "uri" => ""
3524 ),
3525 "movabletype" => array(
3526 "icon" => "movabletype",
3527 "title" => "Movable Type",
3528 "rule" => array(
3529 "MovableType[ /]([0-9.]{1,10})" => "\\1"
3530 ),
3531 "uri" => ""
3532 ),
3533 "mozdex" => array(
3534 "icon" => "mozdex",
3535 "title" => "MozDex",
3536 "rule" => array(
3537 "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3538 ),
3539 "uri" => ""
3540 ),
3541 "mqbot" => array(
3542 "icon" => "robot",
3543 "title" => "MQbot",
3544 "rule" => array(
3545 "MQbot" => ""
3546 ),
3547 "uri" => ""
3548 ),
3549 "msnbot" => array(
3550 "icon" => "bing",
3551 "title" => "Bing",
3552 "rule" => array(
3553 "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3554 "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3555 "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3556 "bingbot[ /]([0-9.]{1,10})" => "\\1"
3557 ),
3558 "uri" => ""
3559 ),
3560 "msnbot-mobile" => array(
3561 "icon" => "msn",
3562 "title" => "MSN Mobile",
3563 "rule" => array(
3564 "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3565 "MSNBOT_Mobile" => "",
3566 "MSMOBOT" => ""
3567 ),
3568 "uri" => ""
3569 ),
3570 "mslivebot" => array(
3571 "icon" => "livesearch",
3572 "title" => "MS Live Search",
3573 "rule" => array(
3574 "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3575 ),
3576 "uri" => ""
3577 ),
3578 "msproxy" => array(
3579 "icon" => "robot",
3580 "title" => "MSProxy",
3581 "rule" => array(
3582 "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3583 ),
3584 "uri" => ""
3585 ),
3586 "msrbot" => array(
3587 "icon" => "robot",
3588 "title" => "MSRBOT",
3589 "rule" => array(
3590 "^MSRBOT" => ""
3591 ),
3592 "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3593 ),
3594 "mswebdav" => array(
3595 "icon" => "robot",
3596 "title" => "MS-WebDAV",
3597 "rule" => array(
3598 "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3599 ),
3600 "uri" => ""
3601 ),
3602 "mticon" => array(
3603 "icon" => "robot",
3604 "title" => "MTIcon",
3605 "rule" => array(
3606 "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3607 ),
3608 "uri" => ""
3609 ),
3610 "multipage-validator" => array(
3611 "icon" => "multipage-validator",
3612 "title" => "Multipage Validator",
3613 "rule" => array(
3614 "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3615 ),
3616 "uri" => "http://www.validator.ca/"
3617 ),
3618 "myrss" => array(
3619 "icon" => "rss",
3620 "title" => "MyRSS",
3621 "rule" => array(
3622 "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3623 ),
3624 "uri" => ""
3625 ),
3626 "multimap" => array(
3627 "icon" => "robot",
3628 "title" => "Multimap",
3629 "rule" => array(
3630 "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3631 ),
3632 "uri" => ""
3633 ),
3634 "najdi" => array(
3635 "icon" => "najdi",
3636 "title" => "Najdi.si",
3637 "rule" => array(
3638 "Najdi.si" => ""
3639 ),
3640 "uri" => "http://www.najdi.si"
3641 ),
3642 "nameprotect" => array(
3643 "icon" => "nameprotect",
3644 "title" => "Name Protect",
3645 "rule" => array(
3646 "NPBot" => ""
3647 ),
3648 "uri" => ""
3649 ),
3650 "nationaldirectory" => array(
3651 "icon" => "robot",
3652 "title" => "National Directory",
3653 "rule" => array(
3654 "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3655 ),
3656 "uri" => ""
3657 ),
3658 "natsumican" => array(
3659 "icon" => "robot",
3660 "title" => "Natsu Mican",
3661 "rule" => array(
3662 "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3663 ),
3664 "uri" => ""
3665 ),
3666 "naverbot" => array(
3667 "icon" => "naverbot",
3668 "title" => "Naver",
3669 "rule" => array(
3670 "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3671 "Naver(Bot)?" => "",
3672 "^nabot" => ""
3673 ),
3674 "uri" => ""
3675 ),
3676 "navisso" => array(
3677 "icon" => "navisso",
3678 "title" => "Navisso",
3679 "rule" => array(
3680 "Navisso(Bot)?" => ""
3681 ),
3682 "uri" => "http://www.navisso.com"
3683 ),
3684 "neevabot" => array(
3685 "icon" => "neeva",
3686 "title" => "Neeva",
3687 "rule" => array(
3688 "Neevabot[ /]([0-9.]{1,10})" => "\\1"
3689 ),
3690 "uri" => "https://neeva.com/neevabot"
3691 ),
3692 "neofonie" => array(
3693 "icon" => "robot",
3694 "title" => "Neofonie",
3695 "rule" => array(
3696 "www.neofonie.de" => ""
3697 ),
3698 "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3699 ),
3700 "neomo" => array(
3701 "icon" => "robot",
3702 "title" => "Neomo",
3703 "rule" => array(
3704 "Francis[ /]([0-9.]{1,10})" => "\\1"
3705 ),
3706 "uri" => ""
3707 ),
3708 "nessus" => array(
3709 "icon" => "nessus",
3710 "title" => "Nessus",
3711 "rule" => array(
3712 "Nessus\)$" => ""
3713 ),
3714 "uri" => ""
3715 ),
3716 "nerdybot" => array(
3717 "icon" => "robot",
3718 "title" => "NerdyBot",
3719 "rule" => array(
3720 "NerdyBot" => ""
3721 ),
3722 "uri" => "http://nerdybot.com/"
3723 ),
3724 "nerdbynature" => array(
3725 "icon" => "nerdbynature",
3726 "title" => "NerdByNature",
3727 "rule" => array(
3728 "NerdByNature.Bot" => ""
3729 ),
3730 "uri" => "http://www.nerdbynature.net/bot"
3731 ),
3732 "netants" => array(
3733 "icon" => "netants",
3734 "title" => "NetAnts",
3735 "rule" => array(
3736 "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3737 ),
3738 "uri" => ""
3739 ),
3740 "netcraft" => array(
3741 "icon" => "netcraft",
3742 "title" => "Netcraft",
3743 "rule" => array(
3744 "netcraft" => ""
3745 ),
3746 "uri" => ""
3747 ),
3748 "netinfo" => array(
3749 "icon" => "netinfo",
3750 "title" => "Netinfo",
3751 "rule" => array(
3752 "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3753 ),
3754 "uri" => "http://netinfo.bg/"
3755 ),
3756 "netluchs" => array(
3757 "icon" => "netluchs",
3758 "title" => "Netluchs",
3759 "rule" => array(
3760 "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3761 ),
3762 "uri" => "http://www.netluchs.de/"
3763 ),
3764 "netmechanic" => array(
3765 "icon" => "netmechanic",
3766 "title" => "NetMechanic",
3767 "rule" => array(
3768 "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3769 ),
3770 "uri" => ""
3771 ),
3772 "netnose" => array(
3773 "icon" => "netnose",
3774 "title" => "NetNose",
3775 "rule" => array(
3776 "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3777 ),
3778 "uri" => ""
3779 ),
3780 "netoskop" => array(
3781 "icon" => "robot",
3782 "title" => "Netoskop",
3783 "rule" => array(
3784 "netoskop" => ""
3785 ),
3786 "uri" => ""
3787 ),
3788 "netpromoter" => array(
3789 "icon" => "netpromoter",
3790 "title" => "NetPromoter",
3791 "rule" => array(
3792 "NetPromoter Spider" => ""
3793 ),
3794 "uri" => "http://www.net-promoter.com/"
3795 ),
// Netprospector crawler.
"netprospector" => array(
    "icon" => "robot",
    "title" => "Netprospector",
    "rule" => array(
        "^netprospector" => ""
    ),
    // Every entry in this table carries a "uri" key; an empty string means
    // that no home page is known, and keeps the key defined for readers of
    // the table.
    "uri" => ""
),
3803 "netpumper" => array(
3804 "icon" => "robot",
3805 "title" => "Netpumper",
3806 "rule" => array(
3807 "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3808 ),
3809 "uri" => ""
3810 ),
3811 "netscapeproxy" => array(
3812 "icon" => "netscape",
3813 "title" => "Netscape Proxy",
3814 "rule" => array(
3815 "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3816 ),
3817 "uri" => ""
3818 ),
3819 "netspective" => array(
3820 "icon" => "robot",
3821 "title" => "NetSpective",
3822 "rule" => array(
3823 "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3824 ),
3825 "uri" => ""
3826 ),
// Netvibes feed fetcher.
"netvibes" => array(
    "icon" => "netvibes",
    "title" => "Netvibes",
    "rule" => array(
        // The pattern has no capture group, so there is no version to refer
        // to; the replacement is left empty instead of pointing at "\\1".
        "^Netvibes" => ""
    ),
    "uri" => ""
),
3835 "newsfire" => array(
3836 "icon" => "newsfire",
3837 "title" => "NewsFire",
3838 "rule" => array(
3839 "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3840 ),
3841 "uri" => ""
3842 ),
3843 "newsgator" => array(
3844 "icon" => "newsgator",
3845 "title" => "NewsGator",
3846 "rule" => array(
3847 "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3848 ),
3849 "uri" => ""
3850 ),
3851 "newzcrawler" => array(
3852 "icon" => "newzcrawler",
3853 "title" => "NewzCrawler",
3854 "rule" => array(
3855 "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3856 ),
3857 "uri" => ""
3858 ),
// Nextopia crawler (NextopiaBOT). It is labelled with its own name so that it
// is not reported as the unrelated NewzCrawler feed reader.
"nextopia" => array(
    // Generic icon; NOTE(review): switch to a dedicated "nextopia" icon if the
    // icon set provides one.
    "icon" => "robot",
    "title" => "Nextopia",
    "rule" => array(
        "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
3867 "ngsearch" => array(
3868 "icon" => "ngsearch",
3869 "title" => "NG Search",
3870 "rule" => array(
3871 "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3872 ),
3873 "uri" => ""
3874 ),
3875 "nimble" => array(
3876 "icon" => "robot",
3877 "title" => "Nimble",
3878 "rule" => array(
3879 "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3880 ),
3881 "uri" => ""
3882 ),
3883 "nmap" => array(
3884 "icon" => "nmap",
3885 "title" => "Nmap",
3886 "rule" => array(
3887 "Nmap Scripting Engine" => ""
3888 ),
3889 "uri" => "http://nmap.org/book/nse.html"
3890 ),
3891 "nusearch" => array(
3892 "icon" => "robot",
3893 "title" => "NuSearch",
3894 "rule" => array(
3895 "^nuSearch" => ""
3896 ),
3897 "uri" => "http://www.nusearch.com/"
3898 ),
3899 "noago" => array(
3900 "icon" => "noago",
3901 "title" => "Noago",
3902 "rule" => array(
3903 "Noago Spider" => ""
3904 ),
3905 "uri" => "http://www.noago.com/"
3906 ),
3907 "noviforum" => array(
3908 "icon" => "noviforum",
3909 "title" => "Noviforum",
3910 "rule" => array(
3911 "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3912 ),
3913 "uri" => ""
3914 ),
3915 "noxtrum" => array(
3916 "icon" => "noxtrum",
3917 "title" => "noXtrum",
3918 "rule" => array(
3919 "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3920 ),
3921 "uri" => ""
3922 ),
3923 "noyona" => array(
3924 "icon" => "robot",
3925 "title" => "Noyona",
3926 "rule" => array(
3927 "noyona.([0-9._]{1,10})" => "\\1"
3928 ),
3929 "uri" => "http://noyona.com/"
3930 ),
3931 "nsauditor" => array(
3932 "icon" => "nsauditor",
3933 "title" => "Nsauditor",
3934 "rule" => array(
3935 "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3936 ),
3937 "uri" => "http://www.nsauditor.com/"
3938 ),
3939 "obidosbot" => array(
3940 "icon" => "robot",
3941 "title" => "Bookwatch",
3942 "rule" => array(
3943 "obidos[ \-]?bot" => ""
3944 ),
3945 "uri" => ""
3946 ),
3947 "objectssearch" => array(
3948 "icon" => "robot",
3949 "title" => "Objects Search",
3950 "rule" => array(
3951 "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3952 ),
3953 "uri" => ""
3954 ),
3955 "obot" => array(
3956 "icon" => "ibm",
3957 "title" => "IBM (ONLY) Crawler",
3958 "rule" => array(
3959 "oBot[ /]([0-9.]{1,10})" => "\\1"
3960 ),
3961 "uri" => "http://filterdb.iss.net/crawler/"
3962 // Previous from "ONLY Solutions GmbH" – that is what the O stands for
3963 ),
3964 "ocawa" => array(
3965 "icon" => "ocawa",
3966 "title" => "Ocawa",
3967 "rule" => array(
3968 "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3969 "Ocawa" => ""
3970 ),
3971 "uri" => "http://www.ocawa.com/"
3972 ),
3973 "octora" => array(
3974 "icon" => "octora",
3975 "title" => "Octora",
3976 "rule" => array(
3977 "^Octora (Beta)?" => ""
3978 ),
3979 "uri" => "http://www.octora.com/"
3980 ),
3981 "offlineexplorer" => array(
3982 "icon" => "robot",
3983 "title" => "OfflineExplorer",
3984 "rule" => array(
3985 "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3986 ),
3987 "uri" => ""
3988 ),
3989 "omea" => array(
3990 "icon" => "omea",
3991 "title" => "Omea Reader",
3992 "rule" => array(
3993 "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3994 ),
3995 "uri" => ""
3996 ),
3997 "onet" => array(
3998 "icon" => "onet",
3999 "title" => "Onet",
4000 "rule" => array(
4001 "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
4002 "Onet\.pl" => "",
4003 "inktomi.search.onet" => ""
4004 ),
4005 "uri" => "http://www.onet.pl"
4006 ),
4007 "online24" => array(
4008 "icon" => "robot",
4009 "title" => "Online24",
4010 "rule" => array(
4011 "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
4012 ),
4013 "uri" => "http://www.online24.de"
4014 ),
4015 "onlinewebcheck" => array(
4016 "icon" => "csehtmlvalidator",
4017 "title" => "CSE HTML Validator",
4018 "rule" => array(
4019 "onlinewebcheck" => ""
4020 ),
4021 "uri" => "http://www.onlinewebcheck.com"
4022 ),
4023 "onsearch" => array(
4024 "icon" => "onsearch",
4025 "title" => "OnSearch",
4026 "rule" => array(
4027 "^onCHECK-Robot" => ""
4028 ),
4029 "uri" => "http://www.onsearch.de"
4030 ),
4031 "onto" => array(
4032 "icon" => "robot",
4033 "title" => "OntoSpider",
4034 "rule" => array(
4035 "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
4036 ),
4037 "uri" => "http://ontospider.i-n.info/"
4038 ),
4039 "openacoon" => array(
4040 "icon" => "robot",
4041 "title" => "OpenAcoon",
4042 "rule" => array(
4043 "^OpenAcoon v([0-9.]{1,10})" => "\\1"
4044 ),
4045 "uri" => "http://www.openacoon.de/"
4046 ),
4047 "openfind" => array(
4048 "icon" => "openfind",
4049 "title" => "Openfind",
4050 "rule" => array(
4051 "openbot[ /]([0-9.]{1,10})" => "\\1",
4052 "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4053 ),
4054 "uri" => ""
4055 ),
4056 "opentagger" => array(
4057 "icon" => "robot",
4058 "title" => "OpenTagger",
4059 "rule" => array(
4060 "^OpenTaggerBot" => ""
4061 ),
4062 "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4063 ),
4064 "opentext" => array(
4065 "icon" => "opentext",
4066 "title" => "OpenText",
4067 "rule" => array(
4068 "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4069 ),
4070 "uri" => "http://www.opentext.net/"
4071 ),
4072 "openweb" => array(
4073 "icon" => "robot",
4074 "title" => "OpenWebSpider",
4075 "rule" => array(
4076 "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4077 "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4078 ),
4079 "uri" => "http://www.openwebspider.org"
4080 ),
4081 "openx" => array(
4082 "icon" => "openx",
4083 "title" => "OpenX Spider",
4084 "rule" => array(
4085 "OpenX" => ""
4086 ),
4087 "uri" => "http://www.openx.org"
4088 ),
4089 "orange" => array(
4090 "icon" => "orange",
4091 "title" => "Orange",
4092 "rule" => array(
4093 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4094 "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4095 ),
4096 "uri" => "http://orange.com/"
4097 ),
4098 "organica" => array(
4099 "icon" => "robot",
4100 "title" => "Organica",
4101 "rule" => array(
4102 "crawler@organica\.us" => ""
4103 ),
4104 "uri" => ""
4105 ),
4106 "outfox" => array(
4107 "icon" => "robot",
4108 "title" => "Outfox Melon",
4109 "rule" => array(
4110 "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4111 "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4112 ),
4113 "uri" => ""
4114 ),
4115 "overture" => array(
4116 "icon" => "overture",
4117 "title" => "Overture",
4118 "rule" => array(
4119 "Overture[ \-]?WebCrawler" => ""
4120 ),
4121 "uri" => ""
4122 ),
4123 "owler" => array(
4124 "icon" => "robot",
4125 "title" => "Owler",
4126 "rule" => array(
4127 "Owler[ /]([0-9.]{1,10})" => "\\1",
4128 "Owler" => ""
4129 ),
4130 "uri" => ""
4131 ),
4132 "page2rss" => array(
4133 "icon" => "page2rss",
4134 "title" => "Page2RSS",
4135 "rule" => array(
4136 "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4137 ),
4138 "uri" => "http://page2rss.com"
4139 ),
4140 "pagebytes" => array(
4141 "icon" => "robot",
4142 "title" => "PageBites",
4143 "rule" => array(
4144 "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4145 ),
4146 "uri" => ""
4147 ),
4148 "pagesinventory" => array(
4149 "icon" => "pagesinventory",
4150 "title" => "PagesInventory",
4151 "rule" => array(
4152 "^PagesInventory" => ""
4153 ),
4154 "uri" => "http://www.pagesinventory.com"
4155 ),
4156 "pagesjaunes" => array(
4157 "icon" => "pagesjaunes",
4158 "title" => "Pages Jaunes",
4159 "rule" => array(
4160 "PJBot[ /]([0-9.]{1,10})" => "\\1"
4161 ),
4162 "uri" => "http://www.pagesjaunes.fr/"
4163 ),
4164 "pagevalet" => array(
4165 "icon" => "wdg",
4166 "title" => "WDG Page Valet",
4167 "rule" => array(
4168 "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4169 ),
4170 "uri" => "http://www.htmlhelp.com/tools/validator/"
4171 ),
4172 "panopeabot" => array(
4173 "icon" => "robot",
4174 "title" => "PanopeaBot",
4175 "rule" => array(
4176 "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4177 ),
4178 "uri" => ""
4179 ),
4180 "parchmenthill" => array(
4181 "icon" => "robot",
4182 "title" => "Parchment Hill",
4183 "rule" => array(
4184 "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4185 ),
4186 "uri" => "http://www.parchmenthill.com/search.htm"
4187 ),
4188 "pascient" => array( // Panscient crawler entry; key and icon are left as-is because other code or assets may refer to them
4189 "icon" => "pascient",
4190 "title" => "Panscient", // display name corrected to match the rule and uri (was "Pascient")
4191 "rule" => array(
4192 "panscient\.com" => "" // dot escaped so only the literal domain matches; no version is extracted
4193 ),
4194 "uri" => "http://www.panscient.com/"
4195 ),
4196 "peerbot" => array(
4197 "icon" => "peerbot",
4198 "title" => "Peerbot",
4199 "rule" => array(
4200 "^PEERbot" => ""
4201 ),
4202 "uri" => ""
4203 ),
4204 "petalbot" => array(
4205 "icon" => "huawei",
4206 "title" => "PetalBot", // Huawei Search - also called Aspiegel
4207 "rule" => array(
4208 "PetalBot" => "",
4209 "AspiegelBot" => ""
4210 ),
4211 "uri" => "https://aspiegel.com/petalbot"
4212 ),
4213 "php" => array(
4214 "icon" => "php",
4215 "title" => "PHP",
4216 "rule" => array(
4217 "^PHP[ /]([0-9.]{1,10})" => "\\1"
4218 ),
4219 "uri" => ""
4220 ),
4221 "phpcrawl" => array(
4222 "icon" => "robot",
4223 "title" => "PHPCrawl",
4224 "rule" => array(
4225 "^PHPCrawl" => ""
4226 ),
4227 "uri" => "http://phpcrawl.cuab.de/"
4228 ),
4229 "phpdig" => array(
4230 "icon" => "robot",
4231 "title" => "PhpDig",
4232 "rule" => array(
4233 "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4234 ),
4235 "uri" => "http://www.finbot.com/"
4236 ),
4237 "phpversiontracker" => array(
4238 "icon" => "phpversiontracker",
4239 "title" => "PHP version tracker",
4240 "rule" => array(
4241 "^PHP version tracker" => ""
4242 ),
4243 "uri" => "http://www.nexen.net/phpversion/bot.php"
4244 ),
4245 "pictureofinternet" => array( // PictureOfInternet user agents
4246 "icon" => "robot",
4247 "title" => "PictureOfInternet",
4248 "rule" => array(
4249 "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // \\1 = captured version; it was previously mapped to "" and thrown away
4250 ),
4251 "uri" => ""
4252 ),
4253 "pingdom" => array(
4254 "icon" => "pingdom",
4255 "title" => "Pingdom",
4256 "rule" => array(
4257 "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4258 "^Pingdom" => ""
4259 ),
4260 "uri" => "http://www.pingdom.com/"
4261 ),
4262 "pinseri" => array(
4263 "icon" => "pinseri",
4264 "title" => "Pinseri",
4265 "rule" => array(
4266 "www\.pinseri\.com/bloglist" => ""
4267 ),
4268 "uri" => ""
4269 ),
4270 "plagger" => array( // Plagger user agents
4271 "icon" => "plagger",
4272 "title" => "Plagger",
4273 "rule" => array(
4274 "Plagger[ /]([0-9.]{1,10})" => "\\1" // \\1 = version following "Plagger/" or "Plagger "
4275 ),
4276 "uri" => "http://plagger.org/" // was "http://www.plugger.org" (project name misspelled)
4277 ),
4278 "planet" => array(
4279 "icon" => "planet",
4280 "title" => "Planet",
4281 "rule" => array(
4282 "Planet[ /]([0-9.]{1,10})" => "\\1"
4283 ),
4284 "uri" => ""
4285 ),
4286 "plantynet" => array(
4287 "icon" => "robot",
4288 "title" => "PlantyNet",
4289 "rule" => array(
4290 "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4291 ),
4292 "uri" => ""
4293 ),
4294 "pluck" => array(
4295 "icon" => "pluck",
4296 "title" => "Pluck",
4297 "rule" => array(
4298 "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4299 ),
4300 "uri" => ""
4301 ),
4302 "plsearch" => array(
4303 "icon" => "plsearch",
4304 "title" => "PlanetSearch",
4305 "rule" => array(
4306 "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4307 ),
4308 "uri" => ""
4309 ),
4310 "poe" => array(
4311 "icon" => "robot",
4312 "title" => "POE-Component",
4313 "rule" => array(
4314 "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4315 ),
4316 "uri" => ""
4317 ),
4318 "pogodak" => array(
4319 "icon" => "pogodak",
4320 "title" => "Pogodak",
4321 "rule" => array(
4322 "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4323 ),
4324 "uri" => ""
4325 ),
4326 "poodle" => array( // Poodle predictor user agents ("Poodle" or "Pooodle" spelling)
4327 "icon" => "robot",
4328 "title" => "Poodle predictor",
4329 "rule" => array(
4330 "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is the (oo|ooo) spelling, so the version is group 2 (was \\1)
4331 "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no version follows the name
4332 ),
4333 "uri" => "http://www.gritechnologies.com/tools/spider.go"
4334 ),
4335 "pompos" => array(
4336 "icon" => "pompos",
4337 "title" => "Pompos",
4338 "rule" => array(
4339 "Pompos[ /]([0-9.]{1,10})" => "\\1"
4340 ),
4341 "uri" => ""
4342 ),
4343 "popdex" => array(
4344 "icon" => "robot",
4345 "title" => "Popdexter",
4346 "rule" => array(
4347 "Popdexter" => ""
4348 ),
4349 "uri" => ""
4350 ),
4351 "postrank" => array(
4352 "icon" => "postrank",
4353 "title" => "PostRank",
4354 "rule" => array(
4355 "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4356 ),
4357 "uri" => "http://www.postrank.com/"
4358 ),
4359 "powermarks" => array(
4360 "icon" => "robot",
4361 "title" => "Powermarks",
4362 "rule" => array(
4363 "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4364 ),
4365 "uri" => ""
4366 ),
4367 "pinterest" => array( // Pinterest user agents
4368 "icon" => "pinterest",
4369 "title" => "Pinterest", // was "PROBE!", copied from the "probe" entry that follows
4370 "rule" => array(
4371 "Pinterest[ /]([0-9.]{1,10})" => "\\1" // \\1 = version following "Pinterest/" or "Pinterest "
4372 ),
4373 "uri" => "http://www.pinterest.com/"
4374 ),
4375 "probe" => array(
4376 "icon" => "robot",
4377 "title" => "PROBE!",
4378 "rule" => array(
4379 "^PROBE!" => ""
4380 ),
4381 "uri" => ""
4382 ),
4383 "projecthoneypot" => array(
4384 "icon" => "projecthoneypot",
4385 "title" => "Project Honeypot",
4386 "rule" => array(
4387 "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4388 "projecthoneypot" => ""
4389 ),
4390 "uri" => "http://www.projecthoneypot.org"
4391 ),
4392 "proxycache" => array(
4393 "icon" => "robot",
4394 "title" => "Proxy Cache",
4395 "rule" => array(
4396 "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4397 ),
4398 "uri" => ""
4399 ),
4400 "proxyhunter" => array(
4401 "icon" => "robot",
4402 "title" => "ProxyHunter",
4403 "rule" => array(
4404 "ProxyHunter" => ""
4405 ),
4406 "uri" => ""
4407 ),
4408 "psbot" => array(
4409 "icon" => "picsearch",
4410 "title" => "PicSearch",
4411 "rule" => array(
4412 "^psbot" => ""
4413 ),
4414 "uri" => ""
4415 ),
4416 "pubsub" => array(
4417 "icon" => "pubsub",
4418 "title" => "PubSub",
4419 "rule" => array(
4420 "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4421 "^PubSub\.com" => ""
4422 ),
4423 "uri" => ""
4424 ),
4425 "pubarch" => array(
4426 "icon" => "robot",
4427 "title" => "PubArchive",
4428 "rule" => array(
4429 "publiclibraryarchive.org" => ""
4430 ),
4431 "uri" => ""
4432 ),
4433 "pukiwiki" => array(
4434 "icon" => "pukiwiki",
4435 "title" => "PukiWiki",
4436 "rule" => array(
4437 "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4438 ),
4439 "uri" => ""
4440 ),
4441 "pwebotxy" => array(
4442 "icon" => "pwebotxy",
4443 "title" => "PWeBot/X.Y",
4444 "rule" => array(
4445 "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4446 ),
4447 "uri" => "http://www.programacionweb.net/robot.php"
4448 ),
4449 "pxys" => array(
4450 "icon" => "robot",
4451 "title" => "PXYS",
4452 "rule" => array(
4453 "^pxys" => ""
4454 ),
4455 "uri" => ""
4456 ),
4457 "qango" => array( // Qango.com user agents
4458 "icon" => "qango",
4459 "title" => "Qango",
4460 "rule" => array(
4461 "^Qango\.com" => "" // dot escaped so only the literal "Qango.com" prefix matches; no version is extracted
4462 ),
4463 "uri" => "http://www.qango.com/" // was "http://www.quango.com/", which disagrees with the name matched by the rule
4464 ),
4465 "qihoo" => array(
4466 "icon" => "qihoo",
4467 "title" => "Qihoo",
4468 "rule" => array(
4469 "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4470 ),
4471 "uri" => "http://www.qihoo.com/"
4472 ),
4473 "qseero" => array(
4474 "icon" => "robot",
4475 "title" => "Qseero",
4476 "rule" => array(
4477 "Qseero v([0-9.]{1,10})" => "\\1"
4478 ),
4479 "uri" => "http://www.q0.com/"
4480 ),
4481 "quantcast" => array(
4482 "icon" => "robot",
4483 "title" => "Quantcast",
4484 "rule" => array(
4485 "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4486 ),
4487 "uri" => "http://www.quantcast.com/"
4488 ),
4489 "quepasa" => array(
4490 "icon" => "quepasa",
4491 "title" => "Quepasa",
4492 "rule" => array(
4493 "Quepasa[ \-]?Creep" => ""
4494 ),
4495 "uri" => ""
4496 ),
4497 "questfinder" => array(
4498 "icon" => "robot",
4499 "title" => "QuestFinder",
4500 "rule" => array(
4501 "www\.questfinder\.com" => ""
4502 ),
4503 "uri" => ""
4504 ),
4505 "qwantify" => array(
4506 "icon" => "qwantify",
4507 "title" => "Qwantify",
4508 "rule" => array(
4509 "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4510 ),
4511 "uri" => "https://www.qwant.com/"
4512 ),
4513 "qweery" => array(
4514 "icon" => "robot",
4515 "title" => "Qweery",
4516 "rule" => array(
4517 "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4518 ),
4519 "uri" => "http://qweerybot.qweery.nl"
4520 ),
4521 "racaicrawler" => array( // RacaiCrawler user agents
4522 "icon" => "robot",
4523 "title" => "RacaiCrawler",
4524 "rule" => array(
4525 "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1" // \\1 = version following "RacaiCrawler " or "RacaiCrawler-"
4526 ),
"uri" => "" // key was missing; added (empty, no homepage known) so this entry has the same shape as every other one
4527 ),
4528 "radian6" => array(
4529 "icon" => "robot",
4530 "title" => "Radian6",
4531 "rule" => array(
4532 "www\.radian6\.com" => ""
4533 ),
4534 "uri" => "http://www.radian6.com"
4535 ),
4536 "radiofx" => array( // Radio.fx user agents
4537 "icon" => "radiofx",
4538 "title" => "Radio.fx",
4539 "rule" => array(
4540 "Radio.fx" => "" // no version is extracted; NOTE(review): the dot is unescaped and matches any character
4541 ),
4542 "uri" => "https://de.tobit.software" // was "https://de.tobit.softwarw" (mistyped TLD)
4543 ),
4544 "rambler" => array(
4545 "icon" => "rambler",
4546 "title" => "Rambler",
4547 "rule" => array(
4548 "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4549 ),
4550 "uri" => ""
4551 ),
4552 "ramiba" => array( // Ramiba user agents ("ramiba" or "ramiba-bot")
4553 "icon" => "robot",
4554 "title" => "Ramiba",
4555 "rule" => array(
4556 "^ramiba(-bot)?" => "" // the only group is the optional "-bot" suffix, not a version, so nothing is reported (was \\1)
4557 ),
4558 "uri" => ""
4559 ),
4560 "rankur" => array(
4561 "icon" => "rankur",
4562 "title" => "Rankur",
4563 "rule" => array(
4564 "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4565 ),
4566 "uri" => "http://rankur.com/",
4567 ),
4568 "red" => array(
4569 "icon" => "red",
4570 "title" => "RED",
4571 "rule" => array(
4572 "RED[ /]([0-9.]{1,10})" => "\\1"
4573 ),
4574 "uri" => "http://redbot.org/"
4575 ),
4576 "rediff" => array(
4577 "icon" => "rediff",
4578 "title" => "Rediff",
4579 "rule" => array(
4580 "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4581 ),
4582 "uri" => "http://www.rediff.com",
4583 ),
4584 "repia" => array(
4585 "icon" => "robot",
4586 "title" => "Repia",
4587 "rule" => array(
4588 "webmaster@repia\.com" => ""
4589 ),
4590 "uri" => ""
4591 ),
4592 "robotgenius" => array(
4593 "icon" => "robot",
4594 "title" => "Robot Genius",
4595 "rule" => array(
4596 "^robotgenius" => ""
4597 ),
4598 "uri" => "http://robotgenius.net",
4599 ),
4600 "robozilla" => array(
4601 "icon" => "robot",
4602 "title" => "Robozilla",
4603 "rule" => array(
4604 "Robozilla" => ""
4605 ),
4606 "uri" => ""
4607 ),
4608 "rogerbot" => array(
4609 "icon" => "moz",
4610 "title" => "Moz Rogerbot",
4611 "rule" => array(
4612 "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4613 ),
4614 "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4615 ),
4616 "rojo" => array(
4617 "icon" => "rojo",
4618 "title" => "Rojo",
4619 "rule" => array(
4620 "Rojo[ /]([0-9.]{1,10})" => "\\1"
4621 ),
4622 "uri" => ""
4623 ),
4624 "rss-atom" => array(
4625 "icon" => "rss",
4626 "title" => "RSS / Atom",
4627 "rule" => array(
4628 "^Apple-PubSub" => "",
4629 "^AppleSyndication" => ""
4630 ),
4631 "uri" => ""
4632 ),
4633 "rssbot" => array(
4634 "icon" => "rss",
4635 "title" => "RSS-bot",
4636 "rule" => array(
4637 "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4638 ),
4639 "uri" => ""
4640 ),
4641 "rssbandit" => array(
4642 "icon" => "rssbandit",
4643 "title" => "RssBandit",
4644 "rule" => array(
4645 "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4646 ),
4647 "uri" => ""
4648 ),
4649 "rssimages" => array(
4650 "icon" => "rss",
4651 "title" => "RssImages",
4652 "rule" => array(
4653 "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4654 ),
4655 "uri" => ""
4656 ),
4657 "rssmicro" => array(
4658 "icon" => "rssmicro",
4659 "title" => "RSSMicro",
4660 "rule" => array(
4661 "RSSMicro\.com" => ""
4662 ),
4663 "uri" => "http://www.rssmicro.com"
4664 ),
4665 "rssowl" => array(
4666 "icon" => "rssowl",
4667 "title" => "RSSOwl",
4668 "rule" => array(
4669 "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4670 ),
4671 "uri" => ""
4672 ),
4673 "rssreader" => array( // RssReader user agents
4674 "icon" => "rss",
4675 "title" => "RssReader",
4676 "rule" => array(
4677 "RssReader[ /]([0-9.]{1,10})" => "\\1" // \\1 = captured version; it was previously mapped to "" and thrown away
4678 ),
4679 "uri" => ""
4680 ),
4681 "rtgi" => array(
4682 "icon" => "rtgi",
4683 "title" => "Rtgi",
4684 "rule" => array(
4685 "RTGI" => ""
4686 ),
4687 "uri" => "http://rtgi.fr/"
4688 ),
4689 "rufusbot" => array(
4690 "icon" => "robot",
4691 "title" => "RufusBot",
4692 "rule" => array(
4693 "RufusBot" => ""
4694 ),
4695 "uri" => ""
4696 ),
4697 "runet" => array(
4698 "icon" => "runet",
4699 "title" => "iTrack RuNet Crawler",
4700 "rule" => array(
4701 "Runet-Research-Crawler" => ""
4702 ),
4703 "uri" => "http://www.itrack.ru/research/cmsrate/"
4704 ),
4705 "runnk" => array(
4706 "icon" => "robot",
4707 "title" => "Runnk",
4708 "rule" => array(
4709 "Runnk RSS finder" => ""
4710 ),
4711 "uri" => "http://www.runnk.com/il/law"
4712 ),
4713 "sagool" => array(
4714 "icon" => "robot",
4715 "title" => "Sagool",
4716 "rule" => array(
4717 "MaSagool" => ""
4718 ),
4719 "uri" => "http://sagool.jp/"
4720 ),
4721 "sanszbot" => array(
4722 "icon" => "robot",
4723 "title" => "Sansz",
4724 "rule" => array(
4725 "SanszBot" => ""
4726 ),
4727 "uri" => ""
4728 ),
4729 "saucereader" => array(
4730 "icon" => "saucereader",
4731 "title" => "Sauce Reader",
4732 "rule" => array(
4733 "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4734 ),
4735 "uri" => ""
4736 ),
4737 "sbider" => array(
4738 "icon" => "sbider",
4739 "title" => "SBIder",
4740 "rule" => array(
4741 "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4742 "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4743 ),
4744 "uri" => ""
4745 ),
4746 "scirus" => array(
4747 "icon" => "robot",
4748 "title" => "Scirus",
4749 "rule" => array(
4750 "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4751 ),
4752 "uri" => ""
4753 ),
4754 "scoutjet" => array(
4755 "icon" => "scoutjet",
4756 "title" => "ScoutJet",
4757 "rule" => array(
4758 "ScoutJet" => ""
4759 ),
4760 "uri" => "http://www.scoutjet.com/"
4761 ),
4762 "scrapy" => array(
4763 "icon" => "scrapy",
4764 "title" => "Scrapy",
4765 "rule" => array(
4766 "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4767 ),
4768 "uri" => "http://scrapy.org"
4769 ),
4770 "scrubby" => array(
4771 "icon" => "scrubby",
4772 "title" => "Scrubby",
4773 "rule" => array(
4774 "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4775 ),
4776 "uri" => ""
4777 ),
4778 "sdm" => array(
4779 "icon" => "sdm",
4780 "title" => "SUN Download Manager",
4781 "rule" => array(
4782 "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4783 ),
4784 "uri" => ""
4785 ),
4786 "sealinks" => array( // SEA-Links user agents, with or without the " HTML-Scanner Pingoo!" suffix
4787 "icon" => "robot",
4788 "title" => "Sea Links",
4789 "rule" => array(
4790 "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional suffix, so the version is group 2
4791 ),
4792 "uri" => ""
4793 ),
4794 "search17" => array(
4795 "icon" => "robot",
4796 "title" => "Search 17",
4797 "rule" => array(
4798 "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4799 ),
4800 "uri" => "http://www.search17.com/bot.php"
4801 ),
4802 "search2" => array(
4803 "icon" => "search2",
4804 "title" => "Search2.net",
4805 "rule" => array(
4806 "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4807 ),
4808 "uri" => "http://search2.net/"
4809 ),
4810 "searchbot" => array(
4811 "icon" => "robot",
4812 "title" => "Searchbot",
4813 "rule" => array(
4814 "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4815 ),
4816 "uri" => ""
4817 ),
4818 "searchch" => array(
4819 "icon" => "robot",
4820 "title" => "Search.ch",
4821 "rule" => array(
4822 "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4823 ),
4824 "uri" => ""
4825 ),
4826 "searchengineworld" => array(
4827 "icon" => "robot",
4828 "title" => "SearchEngineWorld",
4829 "rule" => array(
4830 "searchengineworld" => ""
4831 ),
4832 "uri" => "http://www.searchengineworld.com/"
4833 ),
4834 "searchhippo" => array(
4835 "icon" => "searchhippo",
4836 "title" => "Searchhippo",
4837 "rule" => array(
4838 "searchhippo" => ""
4839 ),
4840 "uri" => "http://www.searchhippo.com/"
4841 ),
4842 "searchthruus" => array(
4843 "icon" => "robot",
4844 "title" => "SearchThruUs",
4845 "rule" => array(
4846 "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4847 ),
4848 "uri" => ""
4849 ),
4850 "securecomputing" => array(
4851 "icon" => "robot",
4852 "title" => "Secure Computing",
4853 "rule" => array(
4854 "securecomputing" => ""
4855 ),
4856 "uri" => ""
4857 ),
4858 "seekport" => array(
4859 "icon" => "seekport",
4860 "title" => "Seekport",
4861 "rule" => array(
4862 "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4863 ),
4864 "uri" => ""
4865 ),
4866 "semanticdiscovery" => array(
4867 "icon" => "robot",
4868 "title" => "Semantic Discovery",
4869 "rule" => array(
4870 "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4871 ),
4872 "uri" => ""
4873 ),
4874 "semrush" => array(
4875 "icon" => "semrush",
4876 "title" => "SEMrush",
4877 "rule" => array(
4878 "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4879 ),
4880 "uri" => "http://www.semrush.com/bot.html"
4881 ),
4882 "sengine" => array(
4883 "icon" => "sengine",
4884 "title" => "Sengine",
4885 "rule" => array(
4886 "netEstate NE Crawler" => ""
4887 ),
4888 "uri" => "http://www.sengine.info/"
4889 ),
4890 "sensis" => array(
4891 "icon" => "sensis",
4892 "title" => "Sensis",
4893 "rule" => array(
4894 "^Sensis(.com.au)? Web Crawler" => ""
4895 ),
4896 "uri" => "http://sensis.com.au"
4897 ),
4898 "seokicks" => array(
4899 "icon" => "seokicks",
4900 "title" => "SEOkicks",
4901 "rule" => array(
4902 "SEOkicks-Robot" => ""
4903 ),
4904 "uri" => "http://www.seokicks.de/"
4905 ),
4906 "seoprofiler" => array(
4907 "icon" => "seoprofiler",
4908 "title" => "SEOprofiler",
4909 "rule" => array(
4910 "spbot[ /]([0-9.]{1,10})" => "\\1"
4911 ),
4912 "uri" => "http://www.seoprofiler.com/"
4913 ),
4914 "setooz" => array(
4915 "icon" => "setooz",
4916 "title" => "Setooz",
4917 "rule" => array(
4918 "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4919 ),
4920 "uri" => "http://www.setooz.com/oozbot.html"
4921 ),
4922 "seznam" => array(
4923 "icon" => "seznam",
4924 "title" => "Seznam",
4925 "rule" => array(
4926 "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4927 "Seznam" => ""
4928 ),
4929 "uri" => "http://www.seznam.cz"
4930 ),
4931 "sharpreader" => array(
4932 "icon" => "sharpreader",
4933 "title" => "SharpReader",
4934 "rule" => array(
4935 "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4936 ),
4937 "uri" => ""
4938 ),
4939 "shelob" => array( // Shelob user agents
4940 "icon" => "shelob",
4941 "title" => "Shelob", // was "Sherlock Spider", which duplicates the title of the separate "sherlockspider" entry
4942 "rule" => array(
4943 "^Shelob" => "" // prefix match only; no version is extracted
4944 ),
4945 "uri" => "http://www.gmx.net"
4946 ),
4947 "sherlockspider" => array(
4948 "icon" => "robot",
4949 "title" => "Sherlock Spider",
4950 "rule" => array(
4951 "sherlock_spider" => ""
4952 ),
4953 "uri" => ""
4954 ),
4955 "shim" => array(
4956 "icon" => "robot",
4957 "title" => "Shim Crawler",
4958 "rule" => array(
4959 "shim[ \-]crawler" => ""
4960 ),
4961 "uri" => ""
4962 ),
4963 "shopwiki" => array(
4964 "icon" => "shopwiki",
4965 "title" => "ShopWiki",
4966 "rule" => array(
4967 "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4968 ),
4969 "uri" => ""
4970 ),
4971 "shoula" => array(
4972 "icon" => "robot",
4973 "title" => "Shoula",
4974 "rule" => array(
4975 "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4976 ),
4977 "uri" => "http://www.shoula.com"
4978 ),
4979 "siege" => array(
4980 "icon" => "robot",
4981 "title" => "Siege",
4982 "rule" => array(
4983 "Siege[ /]([0-9.]{1,10})" => "\\1"
4984 ),
4985 "uri" => ""
4986 ),
4987 "siets" => array(
4988 "icon" => "robot",
4989 "title" => "Siets",
4990 "rule" => array(
4991 "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4992 ),
4993 "uri" => ""
4994 ),
4995 "simpy" => array( // Simpy user agents, identified as either "argus" or "simpy"
4996 "icon" => "simpy",
4997 "title" => "Simpy",
4998 "rule" => array(
4999 "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2", // group 1 is the agent-name alternative, so the version is group 2
5000 ),
5001 "uri" => ""
5002 ),
5003 "singingfish" => array(
5004 "icon" => "singingfish",
5005 "title" => "SingingFish",
5006 "rule" => array(
5007 "asterias[ /]([0-9.]{1,10})" => "\\1",
5008 "Asterias Crawler v([0-9.]{1,10})" => "\\1",
5009 "asterias" => ""
5010 ),
5011 "uri" => ""
5012 ),
5013 "sirketce" => array(
5014 "icon" => "robot",
5015 "title" => "Sirketce",
5016 "rule" => array(
5017 "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
5018 ),
5019 "uri" => "http://www.sirketce.com/bot.html"
5020 ),
5021 "sirobot" => array(
5022 "icon" => "robot",
5023 "title" => "SiroBot",
5024 "rule" => array(
5025 "sirobot" => ""
5026 ),
5027 "uri" => ""
5028 ),
5029 "sistrix" => array(
5030 "icon" => "sistrix",
5031 "title" => "SISTRIX",
5032 "rule" => array(
5033 "SISTRIX Crawler" => ""
5034 ),
5035 "uri" => "http://crawler.sistrix.net/"
5036 ),
5037 "sitebar" => array(
5038 "icon" => "sitebar",
5039 "title" => "SiteBar",
5040 "rule" => array(
5041 "SiteBar[ /]([0-9.]{1,10})" => "\\1"
5042 ),
5043 "uri" => ""
5044 ),
5045 "sitebot" => array(
5046 "icon" => "sitebot",
5047 "title" => "SiteBot",
5048 "rule" => array(
5049 "SiteBot[ /]([0-9.]{1,10})" => "\\1"
5050 ),
5051 "uri" => "http://www.sitebot.org/robot/"
5052 ),
5053 "siteexplorer" => array(
5054 "icon" => "siteexplorer",
5055 "title" => "SiteExplorer",
5056 "rule" => array(
5057 "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5058 ),
5059 "uri" => "http://siteexplorer.info/"
5060 ),
5061 "sitesell" => array( // SiteSell entry, keyed on the "SBIder" agent name
5062 "icon" => "sitesell",
5063 "title" => "SiteSell",
5064 "rule" => array(
5065 "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1" // NOTE(review): the separate "sbider" entry also matches "SBIder/<digits>"; which entry wins depends on how the consumer walks the array - confirm
5066 ),
5067 "uri" => ""
5068 ),
5069 "sitespider" => array(
5070 "icon" => "robot",
5071 "title" => "SiteSpider",
5072 "rule" => array(
5073 "^SiteSpider" => ""
5074 ),
5075 "uri" => ""
5076 ),
5077 "sitesucker" => array(
5078 "icon" => "sitesucker",
5079 "title" => "SiteSucker",
5080 "rule" => array(
5081 "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5082 ),
5083 "uri" => "http://www.sitesucker.us/"
5084 ),
5085 "sitidi" => array(
5086 "icon" => "robot",
5087 "title" => "SitiDi",
5088 "rule" => array(
5089 "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5090 ),
5091 "uri" => ""
5092 ),
5093 "sixy" => array(
5094 "icon" => "robot",
5095 "title" => "Sixy.ch",
5096 "rule" => array(
5097 "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5098 ),
5099 "uri" => "http://sixy.ch"
5100 ),
5101 "skaffe" => array(
5102 "icon" => "robot",
5103 "title" => "Skaffe",
5104 "rule" => array(
5105 "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5106 ),
5107 "uri" => "http://www.skaffe.com"
5108 ),
5109 "skizzle" => array(
5110 "icon" => "skizzle",
5111 "title" => "Skizzle",
5112 "rule" => array(
5113 "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5114 ),
5115 "uri" => "http://www.skizzle.com"
5116 ),
5117 "slider" => array(
5118 "icon" => "robot",
5119 "title" => "Slider",
5120 "rule" => array(
5121 "^Slider[ /]([0-9.]{1,10})" => "\\1"
5122 ),
5123 "uri" => ""
5124 ),
5125 "slugch" => array(
5126 "icon" => "robot",
5127 "title" => "Slugch",
5128 "rule" => array(
5129 "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5130 ),
5131 "uri" => ""
5132 ),
5133 "smartware" => array(
5134 "icon" => "robot",
5135 "title" => "SmartWareSoft",
5136 "rule" => array(
5137 "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5138 ),
5139 "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5140 ),
5141 "snookit" => array(
5142 "icon" => "snookit",
5143 "title" => "Snookit",
5144 "rule" => array(
5145 "^snookit" => ""
5146 ),
5147 "uri" => "http://www.snookit.com/"
5148 ),
5149 "snoopy" => array( // Snoopy user agents
5150 "icon" => "robot",
5151 "title" => "Snoopy",
5152 "rule" => array(
5153 "^Snoopy.+?([0-9.]{1,10})" => "\\1", // lazy .+? so \\1 is the whole version run; the greedy .+ left only its last character
5154 "sna-([0-9.]{1,10})" => "\\1" // \\1 = version following "sna-"
5155 ),
5156 "uri" => "http://snoopy.sourceforge.net/"
5157 ),
5158 "snyke" => array(
5159 "icon" => "robot",
5160 "title" => "Snyke",
5161 "rule" => array(
5162 "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5163 ),
5164 "uri" => "http://www.snyke.com"
5165 ),
5166 "socialradar" => array(
5167 "icon" => "socialradar",
5168 "title" => "Social Radar",
5169 "rule" => array(
5170 "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5171 ),
5172 "uri" => "http://infegy.com/"
5173 ),
5174 "soegning" => array(
5175 "icon" => "soegning",
5176 "title" => "Søgning",
5177 "rule" => array(
5178 "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5179 ),
5180 "uri" => ""
5181 ),
5182 "soft411" => array(
5183 "icon" => "soft411",
5184 "title" => "Soft411",
5185 "rule" => array(
5186 "SOFT411 Directory" => ""
5187 ),
5188 "uri" => ""
5189 ),
5190 "sogou" => array(
5191 "icon" => "sogou",
5192 "title" => "Sogou",
5193 "rule" => array(
5194 "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5195 ),
5196 "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5197 ),
5198 "sohu" => array(
5199 "icon" => "robot",
5200 "title" => "Sohu",
5201 "rule" => array(
5202 "sohu[ \-](agent|search)" => ""
5203 ),
5204 "uri" => ""
5205 ),
5206 "somewhere" => array( // agents identifying themselves as Mozilla@somewhere.com
5207 "icon" => "robot",
5208 "title" => "Somewhere.com",
5209 "rule" => array(
5210 "Mozilla\@somewhere\.com" => "" // the pattern has no capture group, so there is no version to report (was \\1)
5211 ),
5212 "uri" => "http://www.somewhere.com/"
5213 ),
5214 "sopheus" => array(
5215 "icon" => "robot",
5216 "title" => "Sopheus",
5217 "rule" => array(
5218 "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5219 ),
5220 "uri" => "http://www.thenetplanet.com"
5221 ),
5222 "soso" => array(
5223 "icon" => "soso",
5224 "title" => "Soso",
5225 "rule" => array(
5226 "^Soso(image)?spider" => ""
5227 ),
5228 "uri" => "http://help.soso.com/soso-image-spider.htm"
5229 ),
5230 "souppot" => array(
5231 "icon" => "robot",
5232 "title" => "SoupPot",
5233 "rule" => array(
5234 "SoupPotBot" => ""
5235 ),
5236 "uri" => ""
5237 ),
5238 "specificmedia" => array(
5239 "icon" => "specificmedia",
5240 "title" => "Specific Media",
5241 "rule" => array(
5242 "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5243 ),
5244 "uri" => ""
5245 ),
5246 "sphider" => array(
5247 "icon" => "sphider",
5248 "title" => "Sphider",
5249 "rule" => array(
5250 "Sphider" => ""
5251 ),
5252 "uri" => "http://www.sphider.eu"
5253 ),
5254 "spinn3r" => array(
5255 "icon" => "robot",
5256 "title" => "Spinn3r",
5257 "rule" => array(
5258 "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5259 ),
5260 "uri" => "http://spinn3r.com/robot"
5261 ),
5262 "sproose" => array(
5263 "icon" => "robot",
5264 "title" => "Sproose",
5265 "rule" => array(
5266 "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5267 ),
5268 "uri" => "http://www.sproose.com/bot.html"
5269 ),
5270 "spurlbot" => array(
5271 "icon" => "robot",
5272 "title" => "SpurlBot",
5273 "rule" => array(
5274 "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5275 ),
5276 "uri" => ""
5277 ),
5278 "stardownloader" => array(
5279 "icon" => "stardownloader",
5280 "title" => "Star Downloader",
5281 "rule" => array(
5282 "^Star Downloader( Pro)?" => ""
5283 ),
5284 "uri" => ""
5285 ),
5286 "steeler" => array(
5287 "icon" => "robot",
5288 "title" => "Steeler",
5289 "rule" => array(
5290 "Steeler[ /]([0-9.]{1,10})" => "\\1"
5291 ),
5292 "uri" => ""
5293 ),
5294 "strategicboard" => array(
5295 "icon" => "strategicboard",
5296 "title" => "Strategic Board",
5297 "rule" => array(
5298 "Strategic Board Bot" => ""
5299 ),
5300 "uri" => "http://www.strategicboard.com"
5301 ),
5302 "suchbaer" => array(
5303 "icon" => "robot",
5304 "title" => "Suchbaer.de",
5305 "rule" => array(
5306 "^suchbaer\.de" => ""
5307 ),
5308 "uri" => "http://www.suchbaer.de/"
5309 ),
5310 "suchbot" => array(
5311 "icon" => "robot",
5312 "title" => "Suchbot",
5313 "rule" => array(
5314 "^suchbot" => ""
5315 ),
5316 "uri" => ""
5317 ),
5318 "suchende" => array(
5319 "icon" => "suchende",
5320 "title" => "Suchen.de",
5321 "rule" => array(
5322 "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5323 "^gonzo/([0-9.]{1,10})" => "\\1"
5324 ),
5325 "uri" => "http://www.suchen.de/"
5326 ),
5327 "suchknecht" => array(
5328 "icon" => "robot",
5329 "title" => "Suchknecht",
5330 "rule" => array(
5331 "^Suchknecht.at-Robot" => ""
5332 ),
5333 "uri" => "http://www.suchknecht.at/"
5334 ),
5335 "suchpad" => array(
5336 "icon" => "robot",
5337 "title" => "Suchpad",
5338 "rule" => array(
5339 "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5340 ),
5341 "uri" => "http://www.suchpad.de"
5342 ),
5343 "sunrise" => array(
5344 "icon" => "sunrise",
5345 "title" => "Sunrise",
5346 "rule" => array(
5347 "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5348 ),
5349 "uri" => ""
5350 ),
5351 "superbot" => array(
5352 "icon" => "superbot",
5353 "title" => "SuperBot",
5354 "rule" => array(
5355 "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5356 ),
5357 "uri" => ""
5358 ),
5359 "surfcontrol" => array(
5360 "icon" => "robot",
5361 "title" => "SurfControl",
5362 "rule" => array(
5363 "SurfControl" => "",
5364 "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5365 ),
5366 "uri" => ""
5367 ),
5368 "surfnet" => array(
5369 "icon" => "robot",
5370 "title" => "SURFnet",
5371 "rule" => array(
5372 "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5373 ),
5374 "uri" => ""
5375 ),
5376 "surfsafely" => array(
5377 "icon" => "robot",
5378 "title" => "Surfsafely",
5379 "rule" => array(
5380 "Submission Spider at surfsafely.com" => ""
5381 ),
5382 "uri" => "http://www.surfsafely.com"
5383 ),
5384 "surphace" => array( // Surphace user agents, including the older "Sphere Scout" name
5385 "icon" => "spherescout",
5386 "title" => "Surphace",
5387 "rule" => array(
5388 "Sphere Scout.+?([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; lazy .+? so \\1 is the whole version run, not just its last character
5389 "Surphace.+?v([0-9.]{1,10})" => "\\1" // lazy .+? stops at the first "v" that is followed by a version
5390 ),
5391 "uri" => "http://www.surphace.com"
5392 ),
5393 "surveybot" => array(
5394 "icon" => "surveybot",
5395 "title" => "Whois Survey",
5396 "rule" => array(
5397 "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5398 ),
5399 "uri" => ""
5400 ),
5401 "swoogle" => array(
5402 "icon" => "robot",
5403 "title" => "Swoogle",
5404 "rule" => array(
5405 "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5406 ),
5407 "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5408 ),
5409 "swse" => array(
5410 "icon" => "robot",
5411 "title" => "SWSE",
5412 "rule" => array(
5413 "sw\.deri\.org" => ""
5414 ),
5415 "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5416 ),
5417 "swish-e" => array(
5418 "icon" => "swish-e",
5419 "title" => "Swish-e",
5420 "rule" => array(
5421 "^swish-e" => ""
5422 ),
5423 "uri" => "http://swish-e.org/"
5424 ),
5425 "sygol" => array(
5426 "icon" => "sygol",
5427 "title" => "Sygol",
5428 "rule" => array(
5429 "www.sygol.(com|net)" => ""
5430 ),
5431 "uri" => "http://www.sygol.com"
5432 ),
5433 "syllabs" => array(
5434 "icon" => "syllabs",
5435 "title" => "Syllabs",
5436 "rule" => array(
5437 "Focal[-]([0-9.]{1,10})" => "\\1"
5438 ),
5439 "uri" => "http://www.syllabs.com/crawler.html"
5440 ),
5441 "synapse" => array(
5442 "icon" => "robot",
5443 "title" => "Synapse",
5444 "rule" => array(
5445 " Synapse\)" => ""
5446 ),
5447 "uri" => "http://ws.apache.org/synapse/"
5448 ),
5449 "sync2it" => array(
5450 "icon" => "robot",
5451 "title" => "Sync2it",
5452 "rule" => array(
5453 "^\!Susie" => ""
5454 ),
5455 "uri" => "http://www.sync2it.com/bms/susie.php"
5456 ),
5457 "syncit" => array(
5458 "icon" => "robot",
5459 "title" => "Syncit",
5460 "rule" => array(
5461 "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5462 ),
5463 "uri" => "http://www.syncit.com/"
5464 ),
5465 "syndic8" => array(
5466 "icon" => "syndic8",
5467 "title" => "Syndic8",
5468 "rule" => array(
5469 "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5470 ),
5471 "uri" => "http://www.syndic8.com/"
5472 ),
5473 "syndicatie" => array(
5474 "icon" => "robot",
5475 "title" => "Syndicatie.nl",
5476 "rule" => array(
5477 "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5478 "Syndicatie\.nl robot;" => ""
5479 ),
5480 "uri" => ""
5481 ),
5482 "synomia" => array(
5483 "icon" => "robot",
5484 "title" => "Synomia",
5485 "rule" => array(
5486 "^SynoBot" => ""
5487 ),
5488 "uri" => ""
5489 ),
5490 "synoo" => array(
5491 "icon" => "robot",
5492 "title" => "SynooBot",
5493 "rule" => array(
5494 "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5495 ),
5496 "uri" => ""
5497 ),
5498 "szukacz" => array(
5499 "icon" => "szukacz",
5500 "title" => "Szukacz",
5501 "rule" => array(
5502 "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5503 ),
5504 "uri" => ""
5505 ),
5506 "tagoo" => array(
5507 "icon" => "tagoobot",
5508 "title" => "Tagoo",
5509 "rule" => array(
5510 "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5511 ),
5512 "uri" => "http://www.tagoo.ru"
5513 ),
5514 "tagword" => array(
5515 "icon" => "tagword",
5516 "title" => "Tagword",
5517 "rule" => array(
5518 "^Tagword" => ""
5519 ),
5520 "uri" => "http://tagword.com/dmoz_survey.php"
5521 ),
5522 "trailfire" => array(
5523 "icon" => "trailfire",
5524 "title" => "Trailfire",
5525 "rule" => array(
5526 "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5527 ),
5528 "uri" => "http://trailfire.com"
5529 ),
5530 "tamu" => array(
5531 "icon" => "tamu",
5532 "title" => "Tamu Crawler",
5533 "rule" => array(
5534 "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5535 "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5536 ),
5537 "uri" => "http://irl.cs.tamu.edu/crawler/"
5538 ),
5539 "taptubot" => array(
5540 "icon" => "taptubot",
5541 "title" => "Taptu",
5542 "rule" => array(
5543 "taptubot" => ""
5544 ),
5545 "uri" => "http://www.taptu.com/corp/taptubot"
5546 ),
5547 "targetseek" => array(
5548 "icon" => "robot",
5549 "title" => "TargetSeek",
5550 "rule" => array(
5551 "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5552 ),
5553 "uri" => "http://www.targetgroups.net/TargetSeek.html"
5554 ),
5555 "taw" => array(
5556 "icon" => "taw",
5557 "title" => "TAW",
5558 "rule" => array(
5559 "TAW[ /]([0-9.]{1,10})" => "\\1"
5560 ),
5561 "uri" => "http://www.tawdis.net"
5562 ),
5563 "tcd" => array(
5564 "icon" => "tcd",
5565 "title" => "Trinity College Dublin",
5566 "rule" => array(
5567 "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5568 ),
5569 "uri" => "http://www.tcd.ie"
5570 ),
5571 "technorati" => array(
5572 "icon" => "technorati",
5573 "title" => "Technorati",
5574 "rule" => array(
5575 "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5576 ),
5577 "uri" => ""
5578 ),
5579 "teleport" => array(
5580 "icon" => "teleport",
5581 "title" => "Teleport",
5582 "rule" => array(
5583 "Teleport[ \-]?Pro" => ""
5584 ),
5585 "uri" => ""
5586 ),
5587 "terrar" => array(
5588 "icon" => "robot",
5589 "title" => "Terrar",
5590 "rule" => array(
5591 "^Fresh Search :: Terrar" => ""
5592 ),
5593 "uri" => ""
5594 ),
5595 "theophrastus" => array(
5596 "icon" => "robot",
5597 "title" => "Theophrastus",
5598 "rule" => array(
5599 "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5600 ),
5601 "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5602 ),
5603 "thumbnailscz" => array(
5604 "icon" => "robot",
5605 "title" => "Thumbnails.cz",
5606 "rule" => array(
5607 "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5608 ),
5609 "uri" => ""
5610 ),
5611 "thumbshot" => array(
5612 "icon" => "robot",
5613 "title" => "Thumbshots",
5614 "rule" => array(
5615 "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is only the "Version: "/"v" prefix; the version number is group 2
5616 "^thumbshots-de" => ""
5617 ),
5618 "uri" => "http://www.thumbshots.de"
5619 ),
5620 "thunderstone" => array(
5621 "icon" => "thunderstone",
5622 "title" => "Thunderstone",
5623 "rule" => array(
5624 "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5625 "search.thunderstone.com" => ""
5626 ),
5627 "uri" => "http://search.thunderstone.com/"
5628 ),
5629 "timbobot" => array(
5630 "icon" => "robot",
5631 "title" => "TimboBot",
5632 "rule" => array(
5633 "timboBot" => ""
5634 ),
5635 "uri" => ""
5636 ),
5637 "topsy" => array(
5638 "icon" => "topsy",
5639 "title" => "Topsy",
5640 "rule" => array(
5641 "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5642 ),
5643 "uri" => "http://labs.topsy.com/butterfly.html"
5644 ),
5645 "trayce" => array(
5646 "icon" => "robot",
5647 "title" => "Trayce",
5648 "rule" => array(
5649 "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5650 ),
5651 "uri" => ""
5652 ),
5653 "tricus" => array(
5654 "icon" => "robot",
5655 "title" => "Tricus",
5656 "rule" => array(
5657 "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5658 ),
5659 "uri" => ""
5660 ),
5661 "topicblogs" => array(
5662 "icon" => "robot",
5663 "title" => "Topicblogs",
5664 "rule" => array(
5665 "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5666 ),
5667 "uri" => ""
5668 ),
5669 "touche" => array(
5670 "icon" => "touche",
5671 "title" => "Touché",
5672 "rule" => array(
5673 "^Touche" => ""
5674 ),
5675 "uri" => "http://touche.com.ve"
5676 ),
5677 "tuezilla" => array(
5678 "icon" => "robot",
5679 "title" => "TÜzilla", // repaired double-encoded U-umlaut in the display title
5680 "rule" => array(
5681 "tuezilla.de" => ""
5682 ),
5683 "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5684 ),
5685 "turnitin" => array(
5686 "icon" => "turnitin",
5687 "title" => "Turnitin",
5688 "rule" => array(
5689 "TurnitinBot[ /]([0-9.]{1,10})" => "\\1",
5690 "^Turnitin" => ""
5691 ),
5692 "uri" => ""
5693 ),
5694 "tutorgig" => array(
5695 "icon" => "robot",
5696 "title" => "TutorGig",
5697 "rule" => array(
5698 "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5699 ),
5700 "uri" => ""
5701 ),
5702 "twiceler" => array(
5703 "icon" => "cuill",
5704 "title" => "Cuill",
5705 "rule" => array(
5706 "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5707 "Twiceler" => ""
5708 ),
5709 "uri" => "http://www.cuill.com/twiceler/robot.html"
5710 ),
5711 "twingly" => array(
5712 "icon" => "twingly",
5713 "title" => "Twingly",
5714 "rule" => array(
5715 "Twingly Recon" => ""
5716 ),
5717 "uri" => "http://www.twingly.com/"
5718 ),
5719 "twitter" => array(
5720 "icon" => "twitter",
5721 "title" => "Twitter",
5722 "rule" => array(
5723 "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5724 ),
5725 "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5726 ),
5727 "typepad" => array(
5728 "icon" => "typepad",
5729 "title" => "TypePad",
5730 "rule" => array(
5731 "TypePad/([0-9a-z.]{1,10})" => "\\1"
5732 ),
5733 "uri" => ""
5734 ),
5735 "udmsearch" => array(
5736 "icon" => "robot",
5737 "title" => "UdmSearch",
5738 "rule" => array(
5739 "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5740 ),
5741 "uri" => ""
5742 ),
5743 "ukwizz" => array(
5744 "icon" => "ukwizz",
5745 "title" => "UKWizz",
5746 "rule" => array(
5747 "^Mackster.*ukwizz" => ""
5748 ),
5749 "uri" => "http://www.ukwizz.com"
5750 ),
5751 "ultraseek" => array(
5752 "icon" => "robot",
5753 "title" => "Ultraseek",
5754 "rule" => array(
5755 "Ultraseek" => ""
5756 ),
5757 "uri" => ""
5758 ),
5759 "ultraspider" => array(
5760 "icon" => "robot",
5761 "title" => "UltraSpider",
5762 "rule" => array(
5763 "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5764 ),
5765 "uri" => "http://www.search.ch"
5766 ),
5767 "umai" => array(
5768 "icon" => "robot",
5769 "title" => "Umai",
5770 "rule" => array(
5771 "umai[/ ]([0-9.]{1,10})" => "\\1"
5772 ),
5773 "uri" => ""
5774 ),
5775 "unchaos" => array(
5776 "icon" => "robot",
5777 "title" => "Unchaos",
5778 "rule" => array(
5779 "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5780 "unchaos" => ""
5781 ),
5782 "uri" => ""
5783 ),
5784 "unido" => array(
5785 "icon" => "robot",
5786 "title" => "UNIdo",
5787 "rule" => array(
5788 "^unido-bot" => "" // pattern has no capture group, so there is no version to reference
5789 ),
5790 "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5791 ),
5792 "updated" => array(
5793 "icon" => "robot",
5794 "title" => "Updated",
5795 "rule" => array(
5796 "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5797 ),
5798 "uri" => ""
5799 ),
5800 "uptimebot" => array(
5801 "icon" => "robot",
5802 "title" => "UptimeBot",
5803 "rule" => array(
5804 "^UptimeBot" => ""
5805 ),
5806 "uri" => "http://www.uptimebot.com/"
5807 ),
5808 "urifetch" => array(
5809 "icon" => "robot",
5810 "title" => "URI::Fetch",
5811 "rule" => array(
5812 "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5813 ),
5814 "uri" => ""
5815 ),
5816 "urlbase" => array(
5817 "icon" => "robot",
5818 "title" => "URLBase",
5819 "rule" => array(
5820 "URLBase[ /]([0-9.]{1,10})" => "\\1"
5821 ),
5822 "uri" => ""
5823 ),
5824 "urlblaze" => array(
5825 "icon" => "robot",
5826 "title" => "URLBlaze",
5827 "rule" => array(
5828 "^URLBlaze" => ""
5829 ),
5830 "uri" => ""
5831 ),
5832 "urlcontr" => array(
5833 "icon" => "robot",
5834 "title" => "MS URL Control",
5835 "rule" => array(
5836 "Microsoft URL[ \-]?Control" => ""
5837 ),
5838 "uri" => ""
5839 ),
5840 "urlgetfile" => array(
5841 "icon" => "robot",
5842 "title" => "URLGetFile",
5843 "rule" => array(
5844 "^URLGetFile" => ""
5845 ),
5846 "uri" => ""
5847 ),
5848 "urlscope" => array(
5849 "icon" => "robot",
5850 "title" => "UrlScope",
5851 "rule" => array(
5852 "UrlScope" => ""
5853 ),
5854 "uri" => ""
5855 ),
5856 "urltrends" => array(
5857 "icon" => "urltrends",
5858 "title" => "UrlTrends",
5859 "rule" => array(
5860 "Snappy/([0-9.]{1,10})" => "\\1",
5861 ),
5862 "uri" => ""
5863 ),
5864 "usww" => array(
5865 "icon" => "usww",
5866 "title" => "USWW",
5867 "rule" => array(
5868 "usww\.com" => "",
5869 "Mozilla/5\.0 URL-Spider" => ""
5870 ),
5871 "uri" => "http://www.usww.com/"
5872 ),
5873 "usyd" => array(
5874 "icon" => "robot",
5875 "title" => "USyd-NLP-Spider",
5876 "rule" => array(
5877 "^USyd-NLP-Spider" => ""
5878 ),
5879 "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5880 ),
5881 "vagabondo" => array(
5882 "icon" => "wiseguys",
5883 "title" => "WiseGuys",
5884 "rule" => array(
5885 "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5886 "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5887 ),
5888 "uri" => ""
5889 ),
5890 "unicorn" => array(
5891 "icon" => "w3c",
5892 "title" => "W3C Unicorn",
5893 "rule" => array(
5894 "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5895 ),
5896 "uri" => "http://validator.w3.org/unicorn/"
5897 ),
5898 "validator" => array(
5899 "icon" => "w3c",
5900 "title" => "W3C Validator",
5901 "rule" => array(
5902 "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5903 ),
5904 "uri" => "http://validator.w3.org/"
5905 ),
5906 "validator.nu" => array(
5907 "icon" => "validatornu",
5908 "title" => "Validator.nu",
5909 "rule" => array(
5910 "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5911 "^Validator.nu/LV" => "" // no capture group in this pattern, so no version reference
5912 ),
5913 "uri" => "http://validator.nu/"
5914 ),
5915 "verity" => array(
5916 "icon" => "robot",
5917 "title" => "Verity",
5918 "rule" => array(
5919 "^vspider[ /]([0-9.]{1,10})" => "\\1",
5920 "^vspider" => ""
5921 ),
5922 "uri" => "http://www.verity.com/"
5923 ),
5924 "versionsproject" => array(
5925 "icon" => "robot",
5926 "title" => "Versions-project",
5927 "rule" => array(
5928 "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5929 ),
5930 "uri" => "http://www.versions-project.org/"
5931 ),
5932 "verticalmatch" => array(
5933 "icon" => "robot",
5934 "title" => "VerticalMatch",
5935 "rule" => array(
5936 "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5937 ),
5938 "uri" => "http://www.VerticalMatch.com/"
5939 ),
5940 "verzamelgids" => array(
5941 "icon" => "robot",
5942 "title" => "Verzamelgids",
5943 "rule" => array(
5944 "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5945 ),
5946 "uri" => "http://www.verzamelgids.nl/"
5947 ),
5948 "vestris" => array(
5949 "icon" => "vestris",
5950 "title" => "Vestris",
5951 "rule" => array(
5952 "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5953 ),
5954 "uri" => "http://alkaline.vestris.com/"
5955 ),
5956 "vindex" => array(
5957 "icon" => "vindex",
5958 "title" => "Vindex",
5959 "rule" => array(
5960 "Vindex[ /]([0-9.]{1,10})" => "\\1"
5961 ),
5962 "uri" => ""
5963 ),
5964 "visvo" => array(
5965 "icon" => "robot",
5966 "title" => "Visvo",
5967 "rule" => array(
5968 "VisBot[ /]([0-9.]{1,10})" => "\\1"
5969 ),
5970 "uri" => "http://www.visvo.com"
5971 ),
5972 "voila" => array(
5973 "icon" => "voila",
5974 "title" => "Voila",
5975 "rule" => array(
5976 "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5977 "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5978 ),
5979 "uri" => ""
5980 ),
5981 "vonna" => array(
5982 "icon" => "robot",
5983 "title" => "Vonna",
5984 "rule" => array(
5985 "Vonna.com b o t" => ""
5986 ),
5987 "uri" => ""
5988 ),
5989 "vortex" => array(
5990 "icon" => "robot",
5991 "title" => "Vortex",
5992 "rule" => array(
5993 "Vortex[ /]([0-9.]{1,10})" => "\\1"
5994 ),
5995 "uri" => "http://marty.anstey.ca/robots/vortex/"
5996 ),
5997 "w3sitesearch" => array(
5998 "icon" => "w3sitesearch",
5999 "title" => "W3SiteSearch",
6000 "rule" => array(
6001 "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
6002 ),
6003 "uri" => "http://www.w3sitesearch.de"
6004 ),
6005 "wagger" => array(
6006 "icon" => "robot",
6007 "title" => "Wagger",
6008 "rule" => array(
6009 "^Waggr" => ""
6010 ),
6011 "uri" => "http://www.waggr.com/"
6012 ),
6013 "wanadoo" => array(
6014 "icon" => "robot",
6015 "title" => "Wanadoo",
6016 "rule" => array(
6017 "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
6018 ),
6019 "uri" => "http://www.wanadoo.fr/"
6020 ),
6021 "wapalizer" => array(
6022 "icon" => "robot",
6023 "title" => "Wapalizer",
6024 "rule" => array(
6025 "wapalizer[ /]([0-9.]{1,10})" => "\\1"
6026 ),
6027 "uri" => "http://www.wapdrive.com/"
6028 ),
6029 "watson" => array(
6030 "icon" => "addy",
6031 "title" => "Dr.Watson",
6032 "rule" => array(
6033 "Watson[ /]([0-9.]{1,10})" => "\\1",
6034 "watson\.addy\.com" => ""
6035 ),
6036 "uri" => ""
6037 ),
6038 "wavefire" => array(
6039 "icon" => "robot",
6040 "title" => "Wavefire",
6041 "rule" => array(
6042 "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
6043 ),
6044 "uri" => ""
6045 ),
6046 "waypath" => array(
6047 "icon" => "waypath",
6048 "title" => "Waypath",
6049 "rule" => array(
6050 "Waypath[ \-]?Scout" => "",
6051 "Waypath (development )?crawler" => ""
6052 ),
6053 "uri" => ""
6054 ),
6055 "wauuu" => array(
6056 "icon" => "wauuu",
6057 "title" => "Wauuu",
6058 "rule" => array(
6059 "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the pattern's only capture group holds the version
6060 ),
6061 "uri" => "http://www.wauuu.com"
6062 ),
6063 "wdg" => array(
6064 "icon" => "wdg",
6065 "title" => "WDG Validator",
6066 "rule" => array(
6067 "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6068 ),
6069 "uri" => "http://www.htmlhelp.com/tools/validator/"
6070 ),
6071 "webagogo" => array(
6072 "icon" => "webagogo",
6073 "title" => "Webagogo",
6074 "rule" => array(
6075 "^Webagogo" => ""
6076 ),
6077 "uri" => "http://www.webagogo.be/"
6078 ),
6079 "webalta" => array(
6080 "icon" => "webalta",
6081 "title" => "WebAlta",
6082 "rule" => array(
6083 "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6084 ),
6085 "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6086 ),
6087 "webdigity" => array(
6088 "icon" => "robot",
6089 "title" => "Webdigity Whois Service",
6090 "rule" => array(
6091 "^webdigity whois service" => ""
6092 ),
6093 "uri" => "http://www.webdigity.com/ws"
6094 ),
6095 "webelixir" => array(
6096 "icon" => "webelixir",
6097 "title" => "Webelixir",
6098 "rule" => array(
6099 "^webelixir" => ""
6100 ),
6101 "uri" => "http://www.webelixir.net/"
6102 ),
6103 "webbotru" => array(
6104 "icon" => "robot",
6105 "title" => "Webbot.ru",
6106 "rule" => array(
6107 " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6108 ),
6109 "uri" => "http://www.webbot.ru/bot.html"
6110 ),
6111 "webcapture" => array(
6112 "icon" => "robot",
6113 "title" => "WebCapture",
6114 "rule" => array(
6115 "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6116 ),
6117 "uri" => ""
6118 ),
6119 "webcollage" => array(
6120 "icon" => "robot",
6121 "title" => "Webcollage",
6122 "rule" => array(
6123 "webcollage" => ""
6124 ),
6125 "uri" => ""
6126 ),
6127 "webcopier" => array(
6128 "icon" => "webcopier",
6129 "title" => "WebCopier",
6130 "rule" => array(
6131 "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6132 ),
6133 "uri" => ""
6134 ),
6135 "webcorp" => array(
6136 "icon" => "webcorp",
6137 "title" => "WebCorp",
6138 "rule" => array(
6139 "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6140 ),
6141 "uri" => "http://www.webcorp.org.uk/"
6142 ),
6143 "webcrawl" => array(
6144 "icon" => "robot",
6145 "title" => "WebCrawl",
6146 "rule" => array(
6147 "webcrawl\.net" => ""
6148 ),
6149 "uri" => ""
6150 ),
6151 "webdownloader" => array(
6152 "icon" => "robot",
6153 "title" => "Web Downloader",
6154 "rule" => array(
6155 "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6156 ),
6157 "uri" => ""
6158 ),
6159 "webfetch" => array(
6160 "icon" => "robot",
6161 "title" => "WebFetch",
6162 "rule" => array(
6163 "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6164 ),
6165 "uri" => ""
6166 ),
6167 "webfind" => array(
6168 "icon" => "robot",
6169 "title" => "WebFind",
6170 "rule" => array(
6171 "^WebFindBot" => ""
6172 ),
6173 "uri" => "http://www.web-find.com"
6174 ),
6175 "webglimpse" => array(
6176 "icon" => "robot",
6177 "title" => "Webglimpse",
6178 "rule" => array(
6179 "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6180 ),
6181 "uri" => "http://webglimpse.net"
6182 ),
6183 "webgobbler" => array(
6184 "icon" => "robot",
6185 "title" => "webGobbler",
6186 "rule" => array(
6187 "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6188 ),
6189 "uri" => ""
6190 ),
6191 "webimages" => array(
6192 "icon" => "webimages",
6193 "title" => "WebImages",
6194 "rule" => array(
6195 "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6196 ),
6197 "uri" => "http://herbert.groot.jebbink.nl/"
6198 ),
6199 "weblight" => array(
6200 "icon" => "robot",
6201 "title" => "WebLight",
6202 "rule" => array(
6203 "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6204 ),
6205 "uri" => "http://www.illumit.com/Products/weblight/"
6206 ),
6207 "weblinks" => array(
6208 "icon" => "robot",
6209 "title" => "WebLink's",
6210 "rule" => array(
6211 "^Weblink.s checker" => ""
6212 ),
6213 "uri" => ""
6214 ),
6215 "webmeasurement" => array(
6216 "icon" => "robot",
6217 "title" => "Webmeasurement",
6218 "rule" => array(
6219 "^webmeasurement-bot" => ""
6220 ),
6221 "uri" => "http://rvs.informatik.uni-leipzig.de"
6222 ),
6223 "webminer" => array(
6224 "icon" => "robot",
6225 "title" => "WebMiner",
6226 "rule" => array(
6227 "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6228 ),
6229 "uri" => ""
6230 ),
6231 "webmin" => array(
6232 "icon" => "webmin",
6233 "title" => "Webmin",
6234 "rule" => array(
6235 "^webmin" => ""
6236 ),
6237 "uri" => ""
6238 ),
6239 "webmon" => array(
6240 "icon" => "webmon",
6241 "title" => "Webmon",
6242 "rule" => array(
6243 "WebMon[ /]([0-9.]{1,10})" => "\\1"
6244 ),
6245 "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6246 ),
6247 "webox" => array(
6248 "icon" => "robot",
6249 "title" => "WeBoX",
6250 "rule" => array(
6251 "WeBoX[/ ]([0-9.]{1,10})" => "\\1" // group 1 is the version number
6252 ),
6253 "uri" => ""
6254 ),
6255 "webpatrol" => array(
6256 "icon" => "webpatrol",
6257 "title" => "WebPatrol",
6258 "rule" => array(
6259 "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6260 ),
6261 "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6262 ),
6263 "webpix" => array(
6264 "icon" => "webpix",
6265 "title" => "WebPix",
6266 "rule" => array(
6267 "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6268 ),
6269 "uri" => ""
6270 ),
6271 "webrace" => array(
6272 "icon" => "robot",
6273 "title" => "WebRACE",
6274 "rule" => array(
6275 "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6276 ),
6277 "uri" => ""
6278 ),
6279 "webreaper" => array(
6280 "icon" => "webreaper",
6281 "title" => "WebReaper",
6282 "rule" => array(
6283 "^WebReaper " => ""
6284 ),
6285 "uri" => "http://www.webreaper.net/"
6286 ),
6287 "webresult" => array(
6288 "icon" => "robot",
6289 "title" => "Webresult",
6290 "rule" => array(
6291 "Der webresult\.de Robot" => ""
6292 ),
6293 "uri" => ""
6294 ),
6295 "webring" => array(
6296 "icon" => "robot",
6297 "title" => "Webring Checker",
6298 "rule" => array(
6299 "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6300 ),
6301 "uri" => ""
6302 ),
6303 "webripper" => array(
6304 "icon" => "webripper",
6305 "title" => "WebRipper",
6306 "rule" => array(
6307 "^WebRipper" => ""
6308 ),
6309 "uri" => "http://calluna-software.com"
6310 ),
6311 "webscaled" => array(
6312 "icon" => "webscaled",
6313 "title" => "Webscaled",
6314 "rule" => array(
6315 "Swarm" => ""
6316 ),
6317 "uri" => "http://webscaled.com/"
6318 ),
6319 "websearchau" => array(
6320 "icon" => "websearchau",
6321 "title" => "WebSearch.COM.AU",
6322 "rule" => array(
6323 "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6324 ),
6325 "uri" => "http://WebSearch.com.au/"
6326 ),
6327 "websearchbench" => array(
6328 "icon" => "robot",
6329 "title" => "WebSearchBench",
6330 "rule" => array(
6331 "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6332 ),
6333 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6334 ),
6335 "websense" => array(
6336 "icon" => "websense",
6337 "title" => "Websense",
6338 "rule" => array(
6339 "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6340 ),
6341 "uri" => ""
6342 ),
6343 "websiteshadow" => array(
6344 "icon" => "websiteshadow",
6345 "title" => "Websiteshadow",
6346 "rule" => array(
6347 "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6348 ),
6349 "uri" => "http://websiteshadow.com"
6350 ),
6351 "websiteworth" => array(
6352 "icon" => "robot",
6353 "title" => "WebsiteWorth",
6354 "rule" => array(
6355 "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6356 ),
6357 "uri" => "http://directory.sootle.com/website-worth/tata.php"
6358 ),
6359 "websquash" => array(
6360 "icon" => "websquash",
6361 "title" => "Websquash",
6362 "rule" => array(
6363 "webs(quash\.com|ite[ \-]?Monitor)" => ""
6364 ),
6365 "uri" => ""
6366 ),
6367 "webstripper" => array(
6368 "icon" => "robot",
6369 "title" => "WebStripper",
6370 "rule" => array(
6371 "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6372 ),
6373 "uri" => ""
6374 ),
6375 "webzip" => array(
6376 "icon" => "webzip",
6377 "title" => "WebZIP",
6378 "rule" => array(
6379 "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6380 ),
6381 "uri" => ""
6382 ),
6383 "wep" => array(
6384 "icon" => "robot",
6385 "title" => "WEP Search",
6386 "rule" => array(
6387 "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6388 ),
6389 "uri" => ""
6390 ),
6391 "westwind" => array(
6392 "icon" => "robot",
6393 "title" => "West Wind Internet Protocols",
6394 "rule" => array(
6395 "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6396 ),
6397 "uri" => "http://www.west-wind.com/wwipstuff.asp"
6398 ),
6399 "wget" => array(
6400 "icon" => "wget",
6401 "title" => "Wget",
6402 "rule" => array(
6403 "Wget[ /]([0-9.]{1,10})" => "\\1",
6404 "Wget" => ""
6405 ),
6406 "uri" => ""
6407 ),
6408 "whizbang" => array(
6409 "icon" => "whizbang",
6410 "title" => "WhizBang",
6411 "rule" => array(
6412 "WhizBang" => ""
6413 ),
6414 "uri" => "http://www.whizbang.com/crawler/"
6415 ),
6416 "whois" => array(
6417 "icon" => "whois",
6418 "title" => "Who.is",
6419 "rule" => array(
6420 "Who.is Bot" => ""
6421 ),
6422 "uri" => "http://www.who.is/"
6423 ),
6424 "wikiwix" => array(
6425 "icon" => "wikiwix",
6426 "title" => "Wikiwix",
6427 "rule" => array(
6428 "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6429 ),
6430 "uri" => "http://www.wikiwix.com/"
6431 ),
6432 "wingflyer" => array(
6433 "icon" => "robot",
6434 "title" => "WingFlyer",
6435 "rule" => array(
6436 "^WebFetch" => ""
6437 ),
6438 "uri" => "http://www.wingflyer.com/"
6439 ),
6440 "wininet" => array(
6441 "icon" => "robot",
6442 "title" => "WinInet",
6443 "rule" => array(
6444 "TeamSoft WinInet Component" => ""
6445 ),
6446 "uri" => "http://www.winsoft.sk/wininet.htm"
6447 ),
6448 "winhttp" => array(
6449 "icon" => "robot",
6450 "title" => "WinHTTP",
6451 "rule" => array(
6452 "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6453 ),
6454 "uri" => ""
6455 ),
6456 "wire" => array(
6457 "icon" => "robot",
6458 "title" => "WIRE",
6459 "rule" => array(
6460 "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6461 ),
6462 "uri" => ""
6463 ),
6464 "wmp" => array(
6465 "icon" => "robot",
6466 "title" => "WMP",
6467 "rule" => array(
6468 "^WMP" => ""
6469 ),
6470 "uri" => ""
6471 ),
6472 "woozweb" => array(
6473 "icon" => "woozweb",
6474 "title" => "Woozweb",
6475 "rule" => array(
6476 "woozweb" => ""
6477 ),
6478 "uri" => "http://www.woozweb.com/"
6479 ),
6480 "wordchamp" => array(
6481 "icon" => "robot",
6482 "title" => "WordChamp",
6483 "rule" => array(
6484 "^WordChampBot" => ""
6485 ),
6486 "uri" => "http://www.wordchamp.com/"
6487 ),
6488 "wordpress" => array(
6489 "icon" => "wordpress",
6490 "title" => "WordPress",
6491 "rule" => array(
6492 "WordPress[ /]([0-9.]{1,10})" => "\\1"
6493 ),
6494 "uri" => ""
6495 ),
6496 "worio" => array(
6497 "icon" => "worio",
6498 "title" => "Worio",
6499 "rule" => array(
6500 "woriobot" => ""
6501 ),
6502 "uri" => "http://worio.com/"
6503 ),
6504 "worldlight" => array(
6505 "icon" => "worldlight",
6506 "title" => "WorldLight",
6507 "rule" => array(
6508 "^WorldLight" => ""
6509 ),
6510 "uri" => ""
6511 ),
6512 "worqmada" => array(
6513 "icon" => "robot",
6514 "title" => "WorQmada",
6515 "rule" => array(
6516 "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6517 ),
6518 "uri" => ""
6519 ),
6520 "wotbox" => array(
6521 "icon" => "wotbox",
6522 "title" => "Wotbox",
6523 "rule" => array(
6524 "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6525 ),
6526 "uri" => ""
6527 ),
6528 "wp" => array(
6529 "icon" => "wp",
6530 "title" => "Wirtualna Polska",
6531 "rule" => array(
6532 "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6533 ),
6534 "uri" => "http://wp.pl"
6535 ),
6536 "wsb" => array(
6537 "icon" => "robot",
6538 "title" => "WebSearchBench",
6539 "rule" => array(
6540 "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6541 "WSB " => ""
6542 ),
6543 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6544 ),
6545 "wume" => array(
6546 "icon" => "robot",
6547 "title" => "WUME Lab's",
6548 "rule" => array(
6549 "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6550 ),
6551 "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6552 ),
6553 "wusage" => array(
6554 "icon" => "wusage",
6555 "title" => "Wusage",
6556 "rule" => array(
6557 "Wusage[ /]([0-9.]{1,10})" => "\\1",
6558 ),
6559 "uri" => "http://www.boutell.com/wusage/"
6560 ),
6561 "wwgrapevine" => array(
6562 "icon" => "wwgrapevine",
6563 "title" => "WWgrapevine",
6564 "rule" => array(
6565 "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6566 ),
6567 "uri" => ""
6568 ),
6569 "wws" => array(
6570 "icon" => "robot",
6571 "title" => "WWSBOT",
6572 "rule" => array(
6573 "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6574 ),
6575 "uri" => "http://www.analyzer.nu"
6576 ),
6577 "www4mail" => array(
6578 "icon" => "robot",
6579 "title" => "WWW4mail",
6580 "rule" => array(
6581 "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6582 ),
6583 "uri" => "http://www.www4mail.org/"
6584 ),
6585 "wwwc" => array(
6586 "icon" => "wwwc",
6587 "title" => "WWWC",
6588 "rule" => array(
6589 "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6590 ),
6591 "uri" => ""
6592 ),
6593 "wwwd" => array(
6594 "icon" => "robot",
6595 "title" => "WWWD",
6596 "rule" => array(
6597 "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6598 ),
6599 "uri" => ""
6600 ),
6601 "wwweasel" => array(
6602 "icon" => "wwweasel",
6603 "title" => "WWWeasel",
6604 "rule" => array(
6605 "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6606 ),
6607 "uri" => ""
6608 ),
6609 "wwwfi" => array(
6610 "icon" => "wwwfi",
6611 "title" => "www.fi",
6612 "rule" => array(
6613 "www\.fi crawler" => ""
6614 ),
6615 "uri" => "http://www.fi/"
6616 ),
6617 "wwwmechanize" => array(
6618 "icon" => "robot",
6619 "title" => "WWW-Mechanize",
6620 "rule" => array(
6621 "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6622 ),
6623 "uri" => ""
6624 ),
6625 "wwwoffle" => array(
6626 "icon" => "robot",
6627 "title" => "WWWoffle",
6628 "rule" => array(
6629 "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6630 ),
6631 "uri" => ""
6632 ),
6633 "wwwster" => array(
6634 "icon" => "robot",
6635 "title" => "WWWster",
6636 "rule" => array(
6637 "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6638 ),
6639 "uri" => ""
6640 ),
6641 "wysigot" => array(
6642 "icon" => "wysigot",
6643 "title" => "Wysigot",
6644 "rule" => array(
6645 "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6646 ),
6647 "uri" => ""
6648 ),
6649 "xaldon" => array(
6650 "icon" => "xaldon",
6651 "title" => "Xaldon",
6652 "rule" => array(
6653 "Xaldon WebSpider" => ""
6654 ),
6655 "uri" => "http://www.xaldon.de/"
6656 ),
6657 "xenu" => array(
6658 "icon" => "xenu",
6659 "title" => "Xenu Link Sleuth",
6660 "rule" => array(
6661 "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6662 "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional possessive suffix; the version is group 2
6663 "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6664 ),
6665 "uri" => "http://home.snafu.de/tilman/xenulink.html"
6666 ),
6667 "xerka" => array(
6668 "icon" => "xerka",
6669 "title" => "Xerka",
6670 "rule" => array(
6671 "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6672 ),
6673 "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6674 ),
6675 "xirq" => array(
6676 "icon" => "robot",
6677 "title" => "XIRQ",
6678 "rule" => array(
6679 "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6680 ),
6681 "uri" => "http://www.xirq.com"
6682 ),
6683 "xmlslurp" => array(
6684 "icon" => "robot",
6685 "title" => "XMLSlurp",
6686 "rule" => array(
6687 "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6688 ),
6689 "uri" => ""
6690 ),
6691 "xml-sitemaps" => array(
6692 "icon" => "xml-sitemaps",
6693 "title" => "XML-Sitemaps",
6694 "rule" => array(
6695 "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6696 ),
6697 "uri" => ""
6698 ),
6699 "xmlrpc" => array(
6700 "icon" => "robot",
6701 "title" => "Trackback",
6702 "rule" => array(
6703 "XMLRPC" => ""
6704 ),
6705 "uri" => ""
6706 ),
6707 "xovi" => array(
6708 "icon" => "xovi",
6709 "title" => "Xovi",
6710 "rule" => array(
6711 "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6712 ),
6713 "uri" => "http://www.xovibot.net"
6714 ),
6715 "yacy" => array(
6716 "icon" => "yacy",
6717 "title" => "Yacy",
6718 "rule" => array(
6719 "yacy\.net" => ""
6720 ),
6721 "uri" => ""
6722 ),
6723 "yahoo" => array(
6724 "icon" => "yahoo",
6725 "title" => "Yahoo",
6726 "rule" => array(
6727 "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6728 "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6729 "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6730 "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6731 "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6732 "Y!OASIS/TEST" => "",
6733 "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6734 "Y!J; for robot study" => "",
6735 "Yahoo Japan; for robot study" => ""
6736 ),
6737 "uri" => "http://www.yahoo.com"
6738 ),
6739 "yahoo-feed" => array(
6740 "icon" => "yahoo",
6741 "title" => "Yahoo Feedseeker",
6742 "rule" => array(
6743 "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6744 ),
6745 "uri" => "http://www.yahoo.com"
6746 ),
6747 "yandex" => array(
6748 "icon" => "yandex",
6749 "title" => "Yandex",
6750 "rule" => array(
6751 "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6752 "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6753 ),
6754 "uri" => "http://yandex.com/bots"
6755 ),
6756 "yanga" => array(
6757 "icon" => "yanga",
6758 "title" => "Yanga",
6759 "rule" => array (
6760 "^Yanga.*v([0-9.]{1,10})" => "\\1"
6761 ),
6762 "uri" => "http://www.yanga.co.uk/"
6763 ),
6764 "yap" => array(
6765 "icon" => "yap",
6766 "title" => "Yap",
6767 "rule" => array(
6768 "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6769 ),
6770 "uri" => "http://www.yapinc.com/"
6771 ),
6772 "yarienavoir" => array(
6773 "icon" => "robot",
6774 "title" => "Yarienavoir",
6775 "rule" => array(
6776 "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6777 ),
6778 "uri" => "http://www.yarienavoir.net/"
6779 ),
6780 "yell" => array(
6781 "icon" => "yell",
6782 "title" => "Yell",
6783 "rule" => array(
6784 "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6785 "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6786 ),
6787 "uri" => ""
6788 ),
6789 "youdao" => array(
6790 "icon" => "youdao",
6791 "title" => "Youdao",
6792 "rule" => array(
6793 "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6794 "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6795 ),
6796 "uri" => "http://www.youdao.com/help/webmaster/spider/"
6797 ),
6798 "yoogli" => array(
6799 "icon" => "yoogli",
6800 "title" => "Yoogli",
6801 "rule" => array(
6802 "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6803 ),
6804 "uri" => "http://www.yoogli.com"
6805 ),
6806 "yotta" => array(
6807 "icon" => "robot",
6808 "title" => "Yotta",
6809 "rule" => array(
6810 "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6811 "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6812 ),
6813 "uri" => "http://www.yottacars.com"
6814 ),
6815 "yoono" => array(
6816 "icon" => "yoono",
6817 "title" => "Yoono",
6818 "rule" => array(
6819 "Yoono" => ""
6820 ),
6821 "uri" => "http://www.yoono.com/"
6822 ),
6823 "yowedo" => array(
6824 "icon" => "robot",
6825 "title" => "Yowedo",
6826 "rule" => array(
6827 "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6828 ),
6829 "uri" => "http://yowedo.com/en/partners.html"
6830 ),
6831 "yuntis" => array(
6832 "icon" => "robot",
6833 "title" => "Yuntis",
6834 "rule" => array(
6835 "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6836 ),
6837 "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6838 ),
6839 "zao" => array(
6840 "icon" => "robot",
6841 "title" => "Zao",
6842 "rule" => array(
6843 "Zao[ /]([0-9.]{1,10})" => "\\1",
6844 "Zao-crawler" => ""
6845 ),
6846 "uri" => ""
6847 ),
6848 "zealbot" => array(
6849 "icon" => "zeal",
6850 "title" => "ZealBot",
6851 "rule" => array(
6852 "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6853 ),
6854 "uri" => ""
6855 ),
6856 "zearchit" => array(
6857 "icon" => "zearchit",
6858 "title" => "Zearchit",
6859 "rule" => array(
6860 "Zearchit" => ""
6861 ),
6862 "uri" => "http://www.zearchit.de/"
6863 ),
6864 "zebz" => array(
6865 "icon" => "robot",
6866 "title" => "ze.bz",
6867 "rule" => array(
6868 "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6869 ),
6870 "uri" => "http://www.ze.bz/"
6871 ),
6872 "zedzo" => array(
6873 "icon" => "robot",
6874 "title" => "Zedzo",
6875 "rule" => array(
6876 "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6877 ),
6878 "uri" => "http://www.zedzo.com/"
6879 ),
6880 "zerx" => array(
6881 "icon" => "zerx",
6882 "title" => "Zerx",
6883 "rule" => array(
6884 "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6885 ),
6886 "uri" => "http://www.zerx.com/"
6887 ),
6888 "zeus" => array(
6889 "icon" => "zeus",
6890 "title" => "Zeus",
6891 "rule" => array(
6892 "Zeus" => ""
6893 ),
6894 "uri" => "http://www.zeus.com"
6895 ),
6896 "zippp" => array(
6897 "icon" => "robot",
6898 "title" => "Zippp",
6899 "rule" => array(
6900 "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6901 ),
6902 "uri" => ""
6903 ),
6904 "zippy" => array(
6905 "icon" => "robot",
6906 "title" => "Zippy",
6907 "rule" => array(
6908 "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6909 ),
6910 "uri" => "http://www.zippyfinder.com"
6911 ),
6912 "zoeky" => array(
6913 "icon" => "robot",
6914 "title" => "Zoeky",
6915 "rule" => array(
6916 "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6917 ),
6918 "uri" => ""
6919 ),
6920 "zoom" => array(
6921 "icon" => "zoom",
6922 "title" => "ZoomSpider",
6923 "rule" => array(
6924 "^ZoomSpider" => ""
6925 ),
6926 "uri" => "http://www.wrensoft.com/"
6927 ),
6928 "zspider" => array(
6929 "icon" => "robot",
6930 "title" => "Zspider",
6931 "rule" => array(
6932 "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6933 ),
6934 "uri" => "http://feedback.redkolibri.com/"
6935 ),
6936 "zumbot" => array(
6937 "icon" => "robot",
6938 "title" => "ZUM Search",
6939 "rule" => array(
6940 "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6941 ),
6942 "uri" => "http://help.zum.com/inquiry"
6943 ),
6944 "zyborg" => array(
6945 "icon" => "zyborg",
6946 "title" => "WiseNutBot",
6947 "rule" => array(
6948 "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6949 ),
6950 "uri" => ""
6951 ),
6952 // Catch-up entries for the originals; they have to stay in this order.
6953 "blogbot" => array(
6954 "icon" => "blogbot",
6955 "title" => "BlogBot",
6956 "rule" => array(
6957 "Blog[ \-]?Bot" => ""
6958 ),
6959 "uri" => "http://www.blogbot.com/"
6960 ),
6961 "centrum" => array(
6962 "icon" => "centrum",
6963 "title" => "Centrum",
6964 "rule" => array(
6965 "holmes[/ ]([0-9.]{1,10})" => "\\1",
6966 "^Centrum-checker" => ""
6967 ),
6968 "uri" => ""
6969 ),
6970 "httpclient" => array(
6971 "icon" => "robot",
6972 "title" => "HTTPClient",
6973 "rule" => array(
6974 "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6975 "HTTP[ \-]?Client" => ""
6976 ),
6977 "uri" => "http://www.innovation.ch/java/HTTPClient/"
6978 ),
6979 "incywincy" => array(
6980 "icon" => "robot",
6981 "title" => "IncyWincy",
6982 "rule" => array(
6983 "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6984 "^IncyWincy" => ""
6985 ),
6986 "uri" => ""
6987 ),
6988 "java" => array(
6989 "icon" => "java",
6990 "title" => "Java",
6991 "rule" => array(
6992 "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6993 ),
6994 "uri" => ""
6995 ),
6996 "libfetch" => array(
6997 "icon" => "robot",
6998 "title" => "Libfetch",
6999 "rule" => array(
7000 "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
7001 ),
7002 "uri" => "http://www.freebsd.org/"
7003 ),
7004 "libwww" => array(
7005 "icon" => "libwww",
7006 "title" => "LibWWW",
7007 "rule" => array(
7008 "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
7009 "^libww(w|w-perl|w-FM)" => "",
7010 "MyApp.*libww(w|w-perl|w-FM)" => ""
7011 ),
7012 "uri" => ""
7013 ),
7014 "litefinder" => array(
7015 "icon" => "litefinder",
7016 "title" => "LiteFinder",
7017 "rule" => array(
7018 "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
7019 ),
7020 "uri" => "http://www.litefinder.net/about.html"
7021 ),
7022 "nutchorg" => array(
7023 "icon" => "nutchorg",
7024 "title" => "Nutch",
7025 "rule" => array(
7026 "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
7027 "Nutch" => ""
7028 ),
7029 "uri" => "http://lucene.apache.org/nutch/"
7030 ),
7031 "pythonurl" => array(
7032 "icon" => "pythonurl",
7033 "title" => "Python",
7034 "rule" => array(
7035 "python-requests[ /]([0-9.]{1,10})" => "\\1",
7036 "Python[ \-]?urllib" => ""
7037 ),
7038 "uri" => ""
7039 ),
7040 // Robots known to be spam bots
7041 "SPAM" => array(
7042 "icon" => "robot",
7043 "title" => "SPAM",
7044 "rule" => array(
7045 "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
7046 "^PHOTO CHECK" => "",
7047 "^FOTOCHECKER" => "",
7048 "^IPTC CHECK" => "",
7049 "^DataCha0s" => "",
7050 "Datenprovider" => "",
7051 "Expanse" => "",
7052 "Hello World" => "",
7053 "Linux Gnu (cow)" => "",
7054 "Mozilliqa" => "",
7055 "cyberscan.io" => "",
7056 "OPENVASVT" => "",
7057 "researchscan" => "",
7058 "CensysInspect[/ ]([0-9.]{1,10})" => "",
7059 "InternetMeasurement[/ ]([0-9.]{1,10})" => "",
7060 "seocompany[/ ]([0-9.]{1,10})" => "",
7061 "tchelebi[/ ]([0-9.]{1,10})" => "",
7062 "masscan[/ ]([0-9.]{1,10})" => "",
7063 "l9tcpid[/ ]([0-9.]{1,10})" => "",
7064 "zgrab[/ ]([0-9.]{1,10})" => "",
7065 "^Mac Finder" => "",
7066 "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
7067 "^Missouri College Browse" => "",
7068 "Email[ \-]?Siphon" => "",
7069 "atSpider" => "",
7070 "autoemailspider" => "",
7071 "^Demo Bot" => "",
7072 "^Program Shareware" => "",
7073 "^Snapbot" => "",
7074 "^snap.com" => "",
7075 "^Guestbook Auto Submitter" => "",
7076 "panscient.com" => "",
7077 ),
7078 "uri" => ""
7079 ),
7080 // Things we don't know yet
7081 "robot" => array(
7082 "icon" => "robot",
7083 "title" => "Robot",
7084 "rule" => array(
7085 "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7086 )
7087 )
7088 );
7089 ?>

Properties

Name Value
svn:keywords Id