ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 450
Committed: Fri May 5 11:11:34 2023 UTC (18 months, 3 weeks ago) by joku
File size: 161543 byte(s)
Log Message:
update robots

File Contents

# Content
1 <?php
2 /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3 *
4 * SVN FILE $Id$
5 *
6 * Copyright (C) 2001-2023, the BBClone Team (see doc/authors.txt for details)
7 *
8 * This program is free software: you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation, either version 3 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * See doc/copying.txt for details
19 */
20
21 /////////////////////
22 // Robot Detection //
23 /////////////////////
24
25 $robot = array(
26 "1noon" => array(
27 "icon" => "1noon",
28 "title" => "1noon",
29 "rule" => array(
30 "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31 "^Yeti$" => ""
32 ),
33 "uri" => ""
34 ),
35 "123people" => array(
36 "icon" => "123people",
37 "title" => "123people",
38 "rule" => array(
39 "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40 ),
41 "uri" => "http://www.123people.fr/"
42 ),
43 "123spider" => array(
44 "icon" => "robot",
45 "title" => "123Spider",
46 "rule" => array(
47 "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48 ),
49 "uri" => "http://www.123spider.de/"
50 ),
51 "192com" => array(
52 "icon" => "robot",
53 "title" => "192.com",
54 "rule" => array(
55 "192.comAgent" => ""
56 ),
57 "uri" => "http://www.192.com/"
58 ),
59 "200please" => array(
60 "icon" => "200please",
61 "title" => "200please Crawler",
62 "rule" => array(
63 "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64 ),
65 "uri" => "http://www.200please.com/bot"
66 ),
67 "2dehands" => array(
68 "icon" => "2dehands",
69 "title" => "2deHands",
70 "rule" => array(
71 "2dehands\.nl" => ""
72 ),
73 "uri" => ""
74 ),
75 "80legs" => array(
76 "icon" => "80legs",
77 "title" => "80legs",
78 "rule" => array(
79 "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80 ),
81 "uri" => "http://www.80legs.com/"
82 ),
83 "a1sitemap" => array(
84 "icon" => "a1sitemap",
85 "title" => "A1 Sitemap",
86 "rule" => array(
87 "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88 "miggibot[ /]([0-9.]{1,10})" => "\\1"
89 ),
90 "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91 ),
92 "a2b" => array(
93 "icon" => "a2b",
94 "title" => "A2B",
95 "rule" => array(
96 "www\.a2b\.cc" => ""
97 ),
98 "uri" => "http://www.a2b.cc"
99 ),
100 "abacho" => array(
101 "icon" => "robot",
102 "title" => "Abacho",
103 "rule" => array(
104 "^ABACHOBot" => ""
105 ),
106 "uri" => ""
107 ),
108 "abcdatos" => array(
109 "icon" => "abcdatos",
110 "title" => "ABCdatos",
111 "rule" => array(
112 "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113 ),
114 "uri" => "http://www.abcdatos.com/"
115 ),
116 "abot" => array(
117 "icon" => "abot",
118 "title" => "aBot",
119 "rule" => array(
120 "^abot[ /]([0-9.]{1,10})" => "\\1"
121 ),
122 "uri" => ""
123 ),
124 "about" => array(
125 "icon" => "about",
126 "title" => "About",
127 "rule" => array(
128 "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129 "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130 ),
131 "uri" => ""
132 ),
133 "aboutus" => array(
134 "icon" => "aboutus",
135 "title" => "AboutUs",
136 "rule" => array(
137 "AboutUsBot" => ""
138 ),
139 "uri" => "http://www.aboutus.org/"
140 ),
141 "ackerm" => array(
142 "icon" => "robot",
143 "title" => "Ackerm",
144 "rule" => array(
145 "www.ackerm.com" => ""
146 ),
147 "uri" => "http://www.ackerm.com/"
148 ),
149 "acoi" => array(
150 "icon" => "acoi",
151 "title" => "AcoiRobot",
152 "rule" => array(
153 "^AcoiRobot" => ""
154 ),
155 "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156 ),
157 "acoon" => array(
158 "icon" => "acoon",
159 "title" => "Acoon",
160 "rule" => array(
161 "Acoon[ \-]?Robot" => ""
162 ),
163 "uri" => ""
164 ),
165 "accoona" => array(
166 "icon" => "accoona",
167 "title" => "Accoona",
168 "rule" => array(
169 "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170 "^accoona" => ""
171 ),
172 "uri" => ""
173 ),
174 "acme" => array(
175 "icon" => "acme",
176 "title" => "Acme",
177 "rule" => array(
178 "^Acme\.Spider" => ""
179 ),
180 "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181 ),
182 "active" => array(
183 "icon" => "robot",
184 "title" => "ActiveBookmark",
185 "rule" => array(
186 "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187 ),
188 "uri" => ""
189 ),
190 "admuncher" => array(
191 "icon" => "robot",
192 "title" => "Ad Muncher",
193 "rule" => array(
194 "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195 ),
196 "uri" => ""
197 ),
198 "aesop" => array(
199 "icon" => "robot",
200 "title" => "Aesop",
201 "rule" => array(
202 "^AESOP_com_SpiderMan" => ""
203 ),
204 "uri" => "http://www.aesop.com"
205 ),
206 "agada" => array(
207 "icon" => "robot",
208 "title" => "Agada",
209 "rule" => array(
210 "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211 ),
212 "uri" => ""
213 ),
214 "ahrefs" => array(
215 "icon" => "ahrefs",
216 "title" => "Ahrefs",
217 "rule" => array(
218 "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219 ),
220 "uri" => "http://ahrefs.com/"
221 ),
222 "aibot" => array(
223 "icon" => "robot",
224 "title" => "Aibot",
225 "rule" => array(
226 "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227 ),
228 "uri" => ""
229 ),
230 "aihitbot" => array(
231 "icon" => "robot",
232 "title" => "aiHit",
233 "rule" => array(
234 "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235 ),
236 "uri" => "http://www.aihit.com/"
237 ),
238 "aipbot" => array(
239 "icon" => "robot",
240 "title" => "Aipbot",
241 "rule" => array(
242 "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243 ),
244 "uri" => ""
245 ),
246 "aleksika" => array(
247 "icon" => "aleksika",
248 "title" => "Aleksika",
249 "rule" => array(
250 "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251 ),
252 "uri" => ""
253 ),
254 "alertsite" => array(
255 "icon" => "alertsite",
256 "title" => "AlertSite",
257 "rule" => array(
258 "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259 ),
260 "uri" => "http://www.alertsite.com/index.html"
261 ),
262 "alexa" => array(
263 "icon" => "alexa",
264 "title" => "Alexa",
265 "rule" => array(
266 "^ia_archive" => ""
267 ),
268 "uri" => "http://www.alexa.com/"
269 ),
270 "almaden" => array(
271 "icon" => "almaden",
272 "title" => "IBM Crawler",
273 "rule" => array(
274 "www\.almaden\.ibm\.com/cs/crawler" => ""
275 ),
276 "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277 ),
278 "altavista" => array(
279 "icon" => "altavista",
280 "title" => "Altavista",
281 "rule" => array(
282 "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283 "AltaVista V([0-9.]{1,10})" => "\\1",
284 "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285 ),
286 "uri" => "http://www.altavista.com/"
287 ),
288 "amazon" => array(
289 "icon" => "amazon",
290 "title" => "Amazon",
291 "rule" => array(
292 "^(aranhabot|amzn_assoc)" => "",
293 "^NutchEC2Test" => "",
294 "Amazonbot[/ ]([0-9.]{1,10})" => "\\1"
295 ),
296 "uri" => "http://www.amazon.com/"
297 ),
298 "amidalla" => array(
299 "icon" => "amidalla",
300 "title" => "Amidalla",
301 "rule" => array(
302 "^amibot" => ""
303 ),
304 "uri" => ""
305 ),
306 "amfibi" => array(
307 "icon" => "amfibi",
308 "title" => "Amfibi",
309 "rule" => array(
310 "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
311 "Amfibibot" => ""
312 ),
313 "uri" => ""
314 ),
315 "amphetadesk" => array(
316 "icon" => "robot",
317 "title" => "AmphetaDesk",
318 "rule" => array(
319 "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
320 ),
321 "uri" => ""
322 ),
323 "amphetameme" => array(
324 "icon" => "robot",
325 "title" => "Amphetameme",
326 "rule" => array(
327 "amphetameme[ \-]?crawler" => ""
328 ),
329 "uri" => ""
330 ),
331 "annomille" => array(
332 "icon" => "robot",
333 "title" => "AnnoMille",
334 "rule" => array(
335 "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
336 ),
337 "uri" => "http://www.annomille.it"
338 ),
339 "anonymouse" => array(
340 "icon" => "anonymouse",
341 "title" => "Anonymouse.org",
342 "rule" => array(
343 "http://Anonymouse.org" => ""
344 ),
345 "uri" => "http://anonymouse.org"
346 ),
347 "ansearch" => array(
348 "icon" => "robot",
349 "title" => "Ansearch",
350 "rule" => array(
351 "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
352 ),
353 "uri" => ""
354 ),
355 "answerchase" => array(
356 "icon" => "answerchase",
357 "title" => "AnswerChase",
358 "rule" => array(
359 "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
360 ),
361 "uri" => "http://www.answerchase.com/"
362 ),
363 "antibot" => array(
364 "icon" => "robot",
365 "title" => "Antibot",
366 "rule" => array(
367 "antibot-V([0-9.]{1,10})" => "\\1"
368 ),
369 "uri" => ""
370 ),
371 "aonde" => array(
372 "icon" => "aonde",
373 "title" => "Aonde",
374 "rule" => array(
375 "^AONDE-Spider" => ""
376 ),
377 "uri" => ""
378 ),
379 "aonline" => array(
380 "icon" => "robot",
381 "title" => "A-Online.at",
382 "rule" => array(
383 "^A-Online Search" => ""
384 ),
385 "uri" => "http://www.a-online.at/"
386 ),
387 "aol" => array(
388 "icon" => "aol",
389 "title" => "AOLserver",
390 "rule" => array(
391 "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
392 "^AOLserver" => ""
393 ),
394 "uri" => ""
395 ),
396 "apachebench" => array(
397 "icon" => "robot",
398 "title" => "ApacheBench",
399 "rule" => array(
400 "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
401 ),
402 "uri" => ""
403 ),
404 "apassion4jazz" => array(
405 "icon" => "robot",
406 "title" => "Passion 4 Jazz",
407 "rule" => array(
408 "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
409 ),
410 "uri" => "http://www.apassion4jazz.net/bebopbot.html"
411 ),
412 "apexoo" => array(
413 "icon" => "robot",
414 "title" => "Apexoo",
415 "rule" => array(
416 "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
417 ),
418 "uri" => "http://www.apexoo.com/"
419 ),
420 "apnoti" => array(
421 "icon" => "apnoti",
422 "title" => "Apnoti",
423 "rule" => array(
424 "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
425 ),
426 "uri" => "http://www.apnoti.com/"
427 ),
428 "aport" => array(
429 "icon" => "aport",
430 "title" => "Aport",
431 "rule" => array(
432 "^Aport" => ""
433 ),
434 "uri" => ""
435 ),
436 "appie" => array(
437 "icon" => "walhello",
438 "title" => "Walhello",
439 "rule" => array(
440 "appie[ /]([0-9.]{1,10})" => "\\1"
441 ),
442 "uri" => ""
443 ),
444 "apple" => array(
445 "icon" => "apple",
446 "title" => "Apple",
447 "rule" => array(
448 "Applebot[ /]([0-9.]{1,10})" => "\\1"
449 ),
450 "uri" => "http://www.apple.com/go/applebot"
451 ),
452 "appletv" => array( // Apple TV entry; shares the "apple" icon
453 "icon" => "apple",
454 "title" => "AppleTV",
455 "rule" => array(
456 "AppleTV" => "" // pattern has no capture group, so no backreference can apply
457 ),
458 "uri" => "http://www.apple.com/"
459 ),
460
461 "arachmo" => array(
462 "icon" => "arachmo",
463 "title" => "Arachmo",
464 "rule" => array(
465 "compatible; Arachmo" => ""
466 ),
467 "uri" => ""
468 ),
469 "arexera" => array(
470 "icon" => "arexera",
471 "title" => "Arexera",
472 "rule" => array(
473 "^X-Crawler" => "",
474 "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
475 ),
476 "uri" => "http://www.arexera.de/"
477 ),
478 "arianna" => array(
479 "icon" => "arianna",
480 "title" => "Arianna",
481 "rule" => array(
482 "^www.arianna.it" => ""
483 ),
484 "uri" => "http://www.arianna.it/"
485 ),
486 "artface" => array(
487 "icon" => "robot",
488 "title" => "Artface",
489 "rule" => array(
490 "^ArtfaceBot" => ""
491 ),
492 "uri" => ""
493 ),
494 "artviper" => array(
495 "icon" => "artviper",
496 "title" => "artViper",
497 "rule" => array(
498 "artViper" => ""
499 ),
500 "uri" => "http://www.artviper.net/"
501 ),
502 "asinfo" => array(
503 "icon" => "robot",
504 "title" => "Any Search Info",
505 "rule" => array(
506 "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
507 ),
508 "uri" => "http://search-info.com/"
509 ),
510 "ask" => array(
511 "icon" => "askjeeves",
512 "title" => "Ask Jeeves",
513 "rule" => array(
514 "Ask[ \-]?Jeeves" => "",
515 "teomaagent" => ""
516 ),
517 "uri" => ""
518 ),
519 "askaboutoil" => array( // AskAboutOil crawler entry
520 "icon" => "robot",
521 "title" => "AskAboutOil", // own display name; "ASPseek" belongs to the separate "aspseek" entry
522 "rule" => array(
523 "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1" // group 1 is the version number
524 ),
525 "uri" => "http://askaboutoil.com/"
526 ),
527 "asked" => array(
528 "icon" => "robot",
529 "title" => "AskEd!",
530 "rule" => array(
531 "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
532 ),
533 "uri" => "http://asked.jp"
534 ),
535 "aspseek" => array(
536 "icon" => "robot",
537 "title" => "ASPseek",
538 "rule" => array(
539 "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
540 ),
541 "uri" => ""
542 ),
543 "atlocal" => array(
544 "icon" => "robot",
545 "title" => "At Local",
546 "rule" => array(
547 "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
548 ),
549 "uri" => "http://www.atlocal.com/"
550 ),
551 "atomz" => array(
552 "icon" => "atomz",
553 "title" => "Atomz",
554 "rule" => array(
555 "Atomz[/ ]([0-9.]{1,10})" => "\\1"
556 ),
557 "uri" => ""
558 ),
559 "avira" => array(
560 "icon" => "avira",
561 "title" => "Avira SafeSearch",
562 "rule" => array(
563 "^SafeSearch microdata crawler" => ""
564 ),
565 "uri" => "https://safesearch.avira.com"
566 ),
567 "axel" => array(
568 "icon" => "robot",
569 "title" => "Axel",
570 "rule" => array(
571 "^axel" => ""
572 ),
573 "uri" => ""
574 ),
575 "axmo" => array(
576 "icon" => "axmo",
577 "title" => "Axmo",
578 "rule" => array(
579 "AxmoRobot" => ""
580 ),
581 "uri" => ""
582 ),
583 "answerbus" => array(
584 "icon" => "answerbus",
585 "title" => "AnswerBus",
586 "rule" => array(
587 "answerbus" => ""
588 ),
589 "uri" => ""
590 ),
591 "automapit" => array(
592 "icon" => "robot",
593 "title" => "AutoMapIt",
594 "rule" => array(
595 "AutoMapIt[ /](Bot)?" => ""
596 ),
597 "uri" => "http://www.automapit.com/bot.html"
598 ),
599 "augurnfind" => array(
600 "icon" => "robot",
601 "title" => "Augurnfind",
602 "rule" => array(
603 "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
604 ),
605 "uri" => ""
606 ),
607 "awasu" => array(
608 "icon" => "awasu",
609 "title" => "Awasu",
610 "rule" => array(
611 "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
612 ),
613 "uri" => ""
614 ),
615 "axxus" => array(
616 "icon" => "axxus",
617 "title" => "axxus.de",
618 "rule" => array(
619 "whoiam" => ""
620 ),
621 "uri" => "http://www.axxus.de/"
622 ),
623 "ayell" => array(
624 "icon" => "ayell",
625 "title" => "Ayell",
626 "rule" => array(
627 "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
628 ),
629 "uri" => "http://eurobot.ayell.eu"
630 ),
631 "babaloo" => array(
632 "icon" => "babaloo",
633 "title" => "Babaloo",
634 "rule" => array(
635 "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
636 ),
637 "uri" => "http://www.babaloo.si"
638 ),
639 "babe" => array(
640 "icon" => "robot",
641 "title" => "ba.be",
642 "rule" => array(
643 "BACS http://www.ba.be" => ""
644 ),
645 "uri" => "http://www.ba.be/"
646 ),
647 "baidu" => array(
648 "icon" => "baidu",
649 "title" => "Baidu",
650 "rule" => array(
651 "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
652 "Baiduspider" => ""
653 ),
654 "uri" => "http://www.baidu.com/search/spider.html"
655 ),
656 "bananatree" => array(
657 "icon" => "robot",
658 "title" => "BananaTree",
659 "rule" => array(
660 "www\.thebananatree\.org" => ""
661 ),
662 "uri" => "http://www.thebananatree.org/"
663 ),
664 "bdcindexer" => array(
665 "icon" => "robot",
666 "title" => "bdcindexer",
667 "rule" => array(
668 "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
669 ),
670 "uri" => "http://www.business.com/"
671 ),
672 "bdfetch" => array(
673 "icon" => "robot",
674 "title" => "BDFetch",
675 "rule" => array(
676 "^BDFetch" => ""
677 ),
678 "uri" => ""
679 ),
680 "bdncentral" => array(
681 "icon" => "robot",
682 "title" => "Bdncentral",
683 "rule" => array(
684 "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
685 ),
686 "uri" => "http://www.bdncentral.com/robot.html"
687 ),
688 "beammachine" => array(
689 "icon" => "robot",
690 "title" => "BeamMachine",
691 "rule" => array(
692 "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
693 ),
694 "uri" => "http://www.beammachine.net/"
695 ),
696 "become" => array(
697 "icon" => "become",
698 "title" => "Become",
699 "rule" => array(
700 "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
701 "(BecomeBot|Exabot)@exava\.com\)$" => ""
702 ),
703 "uri" => "http://www.become.com/"
704 ),
705 "beebware" => array( // Beebware directory crawler entry
706 "icon" => "robot",
707 "title" => "Beebware",
708 "rule" => array(
709 "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the version is the only capture group, i.e. group 1
710 ),
711 "uri" => ""
712 ),
713 "bigbrother" => array(
714 "icon" => "robot",
715 "title" => "Big Brother",
716 "rule" => array(
717 "^Big Brother" => ""
718 ),
719 "uri" => "http://pauillac.inria.fr/~fpottier/"
720 ),
721 "bigclique" => array(
722 "icon" => "robot",
723 "title" => "BigClique",
724 "rule" => array(
725 "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
726 ),
727 "uri" => "http://www.bigclique.com"
728 ),
729 "biglotron" => array(
730 "icon" => "robot",
731 "title" => "Biglotron",
732 "rule" => array(
733 "^BIGLOTRON" => ""
734 ),
735 "uri" => "http://www.bigclique.com"
736 ),
737 "bigsearch" => array(
738 "icon" => "bigsearch",
739 "title" => "Bigsearch",
740 "rule" => array(
741 "Bigsearch.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1"
742 ),
743 "uri" => ""
744 ),
745 "bilbo" => array(
746 "icon" => "robot",
747 "title" => "Bilbo",
748 "rule" => array(
749 "Bilbo[ /]([0-9.]{1,10})" => "\\1"
750 ),
751 "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
752 ),
753 "bilgi" => array( // Bilgi crawler entry (BilgiBot / BilgiBetaBot)
754 "icon" => "bilgi",
755 "title" => "Bilgi",
756 "rule" => array(
757 "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version is group 2
758 ),
759 "uri" => "http://www.bilgi.com/"
760 ),
761 "bitacle" => array(
762 "icon" => "bitacle",
763 "title" => "Bitacle",
764 "rule" => array(
765 "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
766 ),
767 "uri" => "http://bitacle.org/"
768 ),
769 "bitbeamer" => array(
770 "icon" => "bitbeamer",
771 "title" => "BitBeamer",
772 "rule" => array(
773 "BitBeamer/([0-9.]{1,10})" => "\\1"
774 ),
775 "uri" => ""
776 ),
777 "biz360" => array(
778 "icon" => "biz360",
779 "title" => "Biz360",
780 "rule" => array(
781 "^Biz360 spider" => ""
782 ),
783 "uri" => ""
784 ),
785 "backlinktest" => array(
786 "icon" => "backlinktest",
787 "title" => "BacklinkCrawler",
788 "rule" => array(
789 "BacklinkCrawler" => ""
790 ),
791 "uri" => "http://www.backlinktest.com/crawler.html"
792 ),
793 "blaizbee" => array( // Blaiz-Bee crawler entry
794 "icon" => "blaiz-bee",
795 "title" => "Blaiz-Bee",
796 "rule" => array(
797 "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // keep the captured version instead of discarding it
798 ),
799 "uri" => ""
800 ),
801 "blogbeat" => array(
802 "icon" => "robot",
803 "title" => "BlogBeat",
804 "rule" => array(
805 "BlogBeat/?([0-9.]{1,10})" => "\\1",
806 ),
807 "uri" => "http://www.blogbeat.nl"
808 ),
809 "blogbotde" => array(
810 "icon" => "robot",
811 "title" => "blogbot.de",
812 "rule" => array(
813 "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
814 ),
815 "uri" => "http://blogbot.de/"
816 ),
817 "blogcensus" => array(
818 "icon" => "blogcensus",
819 "title" => "Blogcensus",
820 "rule" => array(
821 "^Blogcensus" => "",
822 ),
823 "uri" => "http://blogcensus.de/bot/"
824 ),
825 "blogdex" => array(
826 "icon" => "robot",
827 "title" => "Blogdex",
828 "rule" => array(
829 "Blogdex[ /]([0-9.]{1,10})" => "\\1",
830 ),
831 "uri" => ""
832 ),
833 "blogg" => array(
834 "icon" => "blogg",
835 "title" => "Blogg",
836 "rule" => array(
837 "^blogg\.de" => ""
838 ),
839 "uri" => ""
840 ),
841 "blogland" => array(
842 "icon" => "robot",
843 "title" => "BlogLand",
844 "rule" => array(
845 "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
846 ),
847 "uri" => ""
848 ),
849 "bloglines" => array(
850 "icon" => "bloglines",
851 "title" => "Bloglines",
852 "rule" => array(
853 "Bloglines[ /]([0-9.]{1,10})" => "\\1",
854 "Bloglines" => ""
855 ),
856 "uri" => ""
857 ),
858 "blogmap" => array(
859 "icon" => "robot",
860 "title" => "Blogmap",
861 "rule" => array(
862 "blogmap" => ""
863 ),
864 "uri" => ""
865 ),
866 "blogosphere" => array(
867 "icon" => "robot",
868 "title" => "Blogosphere",
869 "rule" => array(
870 "Blogosphere" => ""
871 ),
872 "uri" => ""
873 ),
874 "blogpeople" => array(
875 "icon" => "robot",
876 "title" => "BlogPeople",
877 "rule" => array(
878 "BlogPeople" => ""
879 ),
880 "uri" => ""
881 ),
882 "blogpulse" => array(
883 "icon" => "blogpulse",
884 "title" => "Blogpulse",
885 "rule" => array(
886 "Blogpulse" => ""
887 ),
888 "uri" => ""
889 ),
890 "blogranking" => array(
891 "icon" => "blogranking",
892 "title" => "BlogRanking",
893 "rule" => array(
894 "^BlogRanking(/RSS checker)?" => ""
895 ),
896 "uri" => ""
897 ),
898 "blogs" => array(
899 "icon" => "blogs",
900 "title" => "Blo.gs",
901 "rule" => array(
902 "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
903 "blo\.gs" => ""
904 ),
905 "uri" => ""
906 ),
907 "blogshares" => array(
908 "icon" => "blogshares",
909 "title" => "BlogShares",
910 "rule" => array(
911 "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
912 "(^| |\()Blogshares(\.com| |\))" => ""
913 ),
914 "uri" => ""
915 ),
916 "blogslife" => array( // key kept as-is: it may be used as an identifier elsewhere
917 "icon" => "robot",
918 "title" => "BlogsLive", // spelled to agree with the "Blogslive" token the rule matches
919 "rule" => array(
920 "Blogslive" => ""
921 ),
922 "uri" => ""
923 ),
924 "blogsnow" => array(
925 "icon" => "blogsnow",
926 "title" => "BlogsNow",
927 "rule" => array(
928 "blogsnowbot" => "",
929 "BlogsNow" => ""
930 ),
931 "uri" => ""
932 ),
933 "blogstreet" => array(
934 "icon" => "blogstreet",
935 "title" => "BlogStreet",
936 "rule" => array(
937 "^BlogStreetBot" => ""
938 ),
939 "uri" => ""
940 ),
941 "blogsurf" => array(
942 "icon" => "robot",
943 "title" => "BlogSurf",
944 "rule" => array(
945 "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
946 ),
947 "uri" => ""
948 ),
949 "blogtick" => array(
950 "icon" => "robot",
951 "title" => "BlogTick",
952 "rule" => array(
953 "BlogTickServer" => ""
954 ),
955 "uri" => ""
956 ),
957 "blogwatcher" => array(
958 "icon" => "blogwatcher",
959 "title" => "Blogwatcher",
960 "rule" => array(
961 "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
962 ),
963 "uri" => ""
964 ),
965 "blogwise" => array(
966 "icon" => "blogwise",
967 "title" => "Blogwise",
968 "rule" => array(
969 "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
970 ),
971 "uri" => ""
972 ),
973 "boardreader" => array(
974 "icon" => "boardreader",
975 "title" => "BoardReader",
976 "rule" => array(
977 "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
978 ),
979 "uri" => "http://www.boardreader.com"
980 ),
981 "bobby" => array(
982 "icon" => "bobby",
983 "title" => "Bobby",
984 "rule" => array(
985 "bobby[ /]([0-9.]{1,10})" => "\\1"
986 ),
987 "uri" => ""
988 ),
989 "boitho" => array(
990 "icon" => "robot",
991 "title" => "Boitho",
992 "rule" => array(
993 "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
994 ),
995 "uri" => ""
996 ),
997 "booch" => array(
998 "icon" => "robot",
999 "title" => "Booch",
1000 "rule" => array(
1001 "^booch[_ /]([0-9.]{1,10})" => "\\1"
1002 ),
1003 "uri" => ""
1004 ),
1005 "book" => array(
1006 "icon" => "book",
1007 "title" => "Bookmark",
1008 "rule" => array(
1009 "http://www\.bookmark\.ne\.jp" => ""
1010 ),
1011 "uri" => ""
1012 ),
1013 "bookdog" => array(
1014 "icon" => "bookdog",
1015 "title" => "Bookdog",
1016 "rule" => array(
1017 "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1018 ),
1019 "uri" => ""
1020 ),
1021 "bordermanager" => array(
1022 "icon" => "bordermanager",
1023 "title" => "Border Manager",
1024 "rule" => array(
1025 "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1026 ),
1027 "uri" => ""
1028 ),
1029 "botonparade" => array(
1030 "icon" => "botonparade",
1031 "title" => "Bot on Parade",
1032 "rule" => array(
1033 "BotOnParade" => ""
1034 ),
1035 "uri" => "http://www.bots-on-para.de/bot.html"
1036 ),
1037 "botje" => array(
1038 "icon" => "botje",
1039 "title" => "Botje",
1040 "rule" => array(
1041 "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1042 ),
1043 "uri" => "http://www.botje.com/"
1044 ),
1045 "bottomfeeder" => array(
1046 "icon" => "bottomfeeder",
1047 "title" => "BottomFeeder",
1048 "rule" => array(
1049 "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1050 ),
1051 "uri" => ""
1052 ),
1053 "browseremulator" => array(
1054 "icon" => "browseremulator",
1055 "title" => "BrowserEmulator",
1056 "rule" => array(
1057 "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1058 ),
1059 "uri" => "http://www.dejavu.org/emulator.htm"
1060 ),
1061 "browsershots" => array(
1062 "icon" => "browsershots",
1063 "title" => "Browsershots",
1064 "rule" => array(
1065 "Browsershots URL Check" => ""
1066 ),
1067 "uri" => "http://browsershots.org"
1068 ),
1069 "browserspy" => array(
1070 "icon" => "robot",
1071 "title" => "BrowserSpy",
1072 "rule" => array(
1073 "BrowserSpy" => ""
1074 ),
1075 "uri" => ""
1076 ),
1077 "bruinbot" => array(
1078 "icon" => "robot",
1079 "title" => "BruinBot",
1080 "rule" => array(
1081 "BruinBot" => ""
1082 ),
1083 "uri" => ""
1084 ),
1085 "bruno" => array(
1086 "icon" => "robot",
1087 "title" => "Bruno",
1088 "rule" => array(
1089 "^Bruno" => ""
1090 ),
1091 "uri" => ""
1092 ),
1093 "btbot" => array(
1094 "icon" => "btbot",
1095 "title" => "BitTorrent",
1096 "rule" => array(
1097 "BTbot/([0-9.]{1,10})" => "\\1"
1098 ),
1099 "uri" => ""
1100 ),
1101 "bubing" => array(
1102 "icon" => "robot",
1103 "title" => "BUbiNG",
1104 "rule" => array(
1105 "BUbiNG" => ""
1106 ),
1107 "uri" => "http://law.di.unimi.it/BUbiNG.html"
1108 ),
1109 "builtwith" => array(
1110 "icon" => "builtwith",
1111 "title" => "BuiltWith",
1112 "rule" => array(
1113 "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1114 ),
1115 "uri" => "http://builtwith.com/bot.html"
1116 ),
1117 "bulkfeeds" => array(
1118 "icon" => "robot",
1119 "title" => "Bulkfeeds",
1120 "rule" => array(
1121 "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1122 ),
1123 "uri" => ""
1124 ),
1125 "burf" => array(
1126 "icon" => "burf",
1127 "title" => "Burf.com",
1128 "rule" => array(
1129 "^Norbert the Spider" => ""
1130 ),
1131 "uri" => "http://www.burf.com/"
1132 ),
1133 "butch" => array(
1134 "icon" => "robot",
1135 "title" => "Butch",
1136 "rule" => array(
1137 "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1138 ),
1139 "uri" => ""
1140 ),
1141 "buzzlogic" => array(
1142 "icon" => "buzzlogic",
1143 "title" => "Buzzlogic",
1144 "rule" => array(
1145 "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1146 ),
1147 "uri" => "http://www.buzzlogic.com"
1148 ),
1149 "catchbot" => array(
1150 "icon" => "catchbot",
1151 "title" => "CatchBot",
1152 "rule" => array(
1153 "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1154 ),
1155 "uri" => "http://www.catchbot.com"
1156 ),
1157 "camdiscover" => array(
1158 "icon" => "robot",
1159 "title" => "Camdiscover",
1160 "rule" => array(
1161 "^Camcrawler" => ""
1162 ),
1163 "uri" => ""
1164 ),
1165 "cazoodle" => array(
1166 "icon" => "cazoodle",
1167 "title" => "Cazoodle",
1168 "rule" => array(
1169 "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1170 "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1171 ),
1172 "uri" => "http://www.cazoodle.com/cazoodlebot"
1173 ),
1174 "ccbot" => array(
1175 "icon" => "robot",
1176 "title" => "ccBot",
1177 "rule" => array(
1178 "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1179 ),
1180 "uri" => "http://www.commoncrawl.org/bot.html"
1181 ),
1182 "ccgcrawl" => array(
1183 "icon" => "robot",
1184 "title" => "CCGCrawl",
1185 "rule" => array(
1186 "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1187 ),
1188 "uri" => "http://www.myworkbase.com/bot.html"
1189 ),
1190 "cerberian" => array(
1191 "icon" => "robot",
1192 "title" => "Cerberian Drtrs",
1193 "rule" => array(
1194 "^Cerberian Drtrs" => ""
1195 ),
1196 "uri" => ""
1197 ),
1198 "cfnetwork" => array( // CFNetwork client entry
1199 "icon" => "robot",
1200 "title" => "CFNetwork", // own display name; "Cerberian Drtrs" belongs to the "cerberian" entry
1201 "rule" => array(
1202 "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1" // group 1 is the version number
1203 ),
1204 "uri" => "http://www.cfnetwork.be/"
1205 ),
1206 "charlotte" => array(
1207 "icon" => "charlotte",
1208 "title" => "Charlotte",
1209 "rule" => array(
1210 "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1211 ),
1212 "uri" => ""
1213 ),
1214 "cirilizator" => array(
1215 "icon" => "cirilizator",
1216 "title" => "Cirilizator",
1217 "rule" => array(
1218 "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1219 ),
1220 "uri" => ""
1221 ),
1222 "claria" => array(
1223 "icon" => "robot",
1224 "title" => "Claria",
1225 "rule" => array(
1226 "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1227 "(Claria|Diamond)(Bot)" => ""
1228 ),
1229 "uri" => ""
1230 ),
1231 "claymont" => array(
1232 "icon" => "claymont",
1233 "title" => "Claymont",
1234 "rule" => array(
1235 "claymont\.com" => "",
1236 "OliverPerry" => ""
1237 ),
1238 "uri" => "http://www.claymont.com"
1239 ),
1240 "clipinc" => array(
1241 "icon" => "clipinc",
1242 "title" => "ClipInc",
1243 "rule" => array(
1244 "ClipInc" => ""
1245 ),
1246 "uri" => "http://tobit.software"
1247 ),
1248 "clush" => array(
1249 "icon" => "clush",
1250 "title" => "Clush",
1251 "rule" => array(
1252 "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1253 ),
1254 "uri" => ""
1255 ),
1256 "cmsworldmap" => array(
1257 "icon" => "cmsworldmap",
1258 "title" => "CMS World Map",
1259 "rule" => array(
1260 "cmsworldmap" => ""
1261 ),
1262 "uri" => "http://www.cmsworldmap.com/"
1263 ),
1264 "cobion" => array(
1265 "icon" => "robot",
1266 "title" => "Cobion",
1267 "rule" => array(
1268 " (QXW03018|obot)\)" => ""
1269 ),
1270 "uri" => ""
1271 ),
1272 "coccoc" => array(
1273 "icon" => "coccoc",
1274 "title" => "Coccoc",
1275 "rule" => array(
1276 "coccoc[ /]([0-9.]{1,10})" => "\\1",
1277 "coccocbot-web[ /]([0-9.]{1,10})" => "\\1"
1278 ),
1279 "uri" => "http://help.coccoc.com"
1280 ),
1281 "coldfusion" => array(
1282 "icon" => "coldfusion",
1283 "title" => "ColdFusion",
1284 "rule" => array(
1285 "^coldfusion" => ""
1286 ),
1287 "uri" => ""
1288 ),
1289 "combine" => array(
1290 "icon" => "robot",
1291 "title" => "Combine",
1292 "rule" => array(
1293 "Combine[ /]([0-9.]{1,10})" => "\\1"
1294 ),
1295 "uri" => ""
1296 ),
1297 "combot" => array(
1298 "icon" => "robot",
1299 "title" => "comBot",
1300 "rule" => array(
1301 "^comBot[ /]([0-9.]{1,10})" => "\\1"
1302 ),
1303 "uri" => ""
1304 ),
1305 "comet" => array(
1306 "icon" => "comet",
1307 "title" => "Comet",
1308 "rule" => array(
1309 "cometsearch@cometsystems" => ""
1310 ),
1311 "uri" => ""
1312 ),
1313 "commerobo" => array(
1314 "icon" => "robot",
1315 "title" => "Commerobo",
1316 "rule" => array(
1317 "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1318 ),
1319 "uri" => ""
1320 ),
1321 "comrite" => array(
1322 "icon" => "robot",
1323 "title" => "ComRite",
1324 "rule" => array(
1325 "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1326 ),
1327 "uri" => "http://www.comrite.com/"
1328 ),
1329 "convera" => array(
1330 "icon" => "convera",
1331 "title" => "Convera",
1332 "rule" => array(
1333 "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1334 "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1335 ),
1336 "uri" => ""
1337 ),
1338 "coolbot" => array(
1339 "icon" => "robot",
1340 "title" => "CoolBot",
1341 "rule" => array(
1342 "^CoolBot" => ""
1343 ),
1344 "uri" => ""
1345 ),
1346 "cosmix" => array(
1347 "icon" => "robot",
1348 "title" => "Cosmix",
1349 "rule" => array(
1350 "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1351 ),
1352 "uri" => ""
1353 ),
1354 "cosmos" => array(
1355 "icon" => "robot",
1356 "title" => "Cosmos",
1357 "rule" => array(
1358 "^cosmos" => ""
1359 ),
1360 "uri" => ""
1361 ),
1362 "cosmoty" => array(
1363 "icon" => "robot",
1364 "title" => "Cosmoty",
1365 "rule" => array(
1366 "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1367 ),
1368 "uri" => "http://www.uchoose.de/crawler/beautybot/"
1369 ),
1370 "covario" => array(
1371 "icon" => "covario",
1372 "title" => "Covario",
1373 "rule" => array(
1374 "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1375 ),
1376 "uri" => "http://www.covario.com/ids/"
1377 ),
1378 "creativecommons" => array(
1379 "icon" => "creativecommons",
1380 "title" => "Creative Commons",
1381 "rule" => array(
1382 "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1383 ),
1384 "uri" => ""
1385 ),
1386 "cscrawler" => array(
1387 "icon" => "robot",
1388 "title" => "CsCrawler",
1389 "rule" => array(
1390 "CsCrawler" => ""
1391 ),
1392 "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1393 ),
1394 "jigsaw" => array(
1395 "icon" => "jigsaw",
1396 "title" => "Jigsaw",
1397 "rule" => array(
1398 "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1399 ),
1400 "uri" => "http://jigsaw.w3.org/css-validator/"
1401 ),
1402 "csscheck" => array(
1403 "icon" => "w3c",
1404 "title" => "W3C CSS Validator",
1405 "rule" => array(
1406 "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1407 ),
1408 "uri" => "http://jigsaw.w3.org/css-validator/"
1409 ),
1410 "custo" => array(
1411 "icon" => "robot",
1412 "title" => "Custo",
1413 "rule" => array(
1414 "Custo[ /]([0-9.]{1,10})" => "\\1"
1415 ),
1416 "uri" => ""
1417 ),
1418 "cybernavi" => array(
1419 "icon" => "robot",
1420 "title" => "CyberNavi",
1421 "rule" => array(
1422 "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1423 ),
1424 "uri" => ""
1425 ),
1426 "cyberpatrol" => array(
1427 "icon" => "cyberpatrol",
1428 "title" => "CyberPatrol",
1429 "rule" => array(
1430 "^CyberPatrol" => ""
1431 ),
1432 "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1433 ),
1434 "cyberz" => array(
1435 "icon" => "cyberz",
1436 "title" => "Cyberz",
1437 "rule" => array(
1438 "Cyberz Communication Agent" => ""
1439 ),
1440 "uri" => ""
1441 ),
1442 "cydral" => array(
1443 "icon" => "robot",
1444 "title" => "Cydral",
1445 "rule" => array(
1446 "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1447 ),
1448 "uri" => ""
1449 ),
1450 "cynthia" => array(
1451 "icon" => "cynthia",
1452 "title" => "Cynthia Says",
1453 "rule" => array(
1454 "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1455 ),
1456 "uri" => ""
1457 ),
1458 "d4x" => array(
1459 "icon" => "d4x",
1460 "title" => "Downloader for X",
1461 "rule" => array(
1462 "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1463 ),
1464 "uri" => ""
1465 ),
1466 "da" => array(
1467 "icon" => "da",
1468 "title" => "DA",
1469 "rule" => array(
1470 "^DA[ /]([0-9.]{1,10})" => "\\1"
1471 ),
1472 "uri" => ""
1473 ),
1474 "daum" => array(
1475 "icon" => "daum",
1476 "title" => "DAUM",
1477 "rule" => array(
1478 "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1479 "Daum[ /]([0-9.]{1,10})" => "\\1",
1480 "DAUM Web Robot" => "",
1481 "daum.net" => "",
1482 "Daum Communications Corp" => "",
1483 "EDI[ /]([0-9.]{1,10})" => "\\1",
1484 "Edacious.*Intelligent Web Robot" => "",
1485 "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1486 ),
1487 "uri" => "http://ws.daum.net/"
1488 ),
1489 "daypop" => array(
1490 "icon" => "robot",
1491 "title" => "Daypop",
1492 "rule" => array(
1493 "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1494 ),
1495 "uri" => ""
1496 ),
1497 "delfi" => array(
1498 "icon" => "delfi",
1499 "title" => "Delfi",
1500 "rule" => array(
1501 "crawl at delfi dot lt" => ""
1502 ),
1503 "uri" => ""
1504 ),
1505 "depspid" => array(
1506 "icon" => "depspid",
1507 "title" => "DepSpid",
1508 "rule" => array(
1509 "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1510 ),
1511 "uri" => ""
1512 ),
1513 "devonagent" => array(
1514 "icon" => "devonagent",
1515 "title" => "DEVONagent",
1516 "rule" => array(
1517 "DEVONtech" => ""
1518 ),
1519 "uri" => ""
1520 ),
1521 "diffbot" => array(
1522 "icon" => "diffbot",
1523 "title" => "Diffbot",
1524 "rule" => array(
1525 " Diffbot" => ""
1526 ),
1527 "uri" => "http://www.diffbot.com"
1528 ),
1529 "diribot" => array(
1530 "icon" => "diribot",
1531 "title" => "Diri",
1532 "rule" => array(
1533 "diribot" => ""
1534 ),
1535 "uri" => "http://www.diri.bg"
1536 ),
1537 "directhit" => array(
1538 "icon" => "robot",
1539 "title" => "Direct Hit",
1540 "rule" => array(
1541 "EZResult -- Internet Search Engine" => ""
1542 ),
1543 "uri" => "http://www.directhit.com"
1544 ),
1545 "disco" => array(
1546 "icon" => "disco",
1547 "title" => "Disco",
1548 "rule" => array(
1549 "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1550 "discobot[/ -]([0-9.]{1,10})" => "\\1",
1551 "disco-crawl@discoveryengine.com" => ""
1552 ),
1553 "uri" => "http://www.discoveryengine.com/"
1554 ),
1555 "discopump" => array(
1556 "icon" => "robot",
1557 "title" => "DISCo Pump",
1558 "rule" => array(
1559 "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1560 ),
1561 "uri" => ""
1562 ),
1563 "dkimreputation" => array(
1564 "icon" => "dkimreputation",
1565 "title" => "DKIM Reputation",
1566 "rule" => array(
1567 "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1568 ),
1569 "uri" => "http://www.dkim-reputation.org"
1570 ),
1571 "dnsdigger" => array(
1572 "icon" => "dnsdigger",
1573 "title" => "DNS-Digger",
1574 "rule" => array(
1575 "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1576 ),
1577 "uri" => "http://www.dnsdigger.com"
1578 ),
1579 "dnsvalidation" => array(
1580 "icon" => "dnsvalidation",
1581 "title" => "DNS Validation",
1582 "rule" => array(
1583 "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1584 ),
1585 "uri" => "http://www.dnsvalidation.com/"
1586 ),
1587 "doctorhtml" => array(
1588 "icon" => "robot",
1589 "title" => "DoctorHTML",
1590 "rule" => array(
1591 "Doctor[ \-]?HTML" => ""
1592 ),
1593 "uri" => ""
1594 ),
1595 "dolphin" => array(
1596 "icon" => "dolphin",
1597 "title" => "Dolphin",
1598 "rule" => array(
1599 "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1600 ),
1601 "uri" => "http://telehouse.ru/crawler.html"
1602 ),
1603 "domaindatei" => array(
1604 "icon" => "robot",
1605 "title" => "Domaindatei",
1606 "rule" => array(
1607 "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1608 ),
1609 "uri" => ""
1610 ),
1611 "dontbuylists" => array(
1612 "icon" => "dontbuylists",
1613 "title" => "Dontbuylists",
1614 "rule" => array(
1615 "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1616 ),
1617 "uri" => "http://www.dontbuylists.com"
1618 ),
1619 "dotbot" => array(
1620 "icon" => "robot",
1621 "title" => "DotBot",
1622 "rule" => array(
1623 "DotBot[ /]([0-9.]{1,10})" => "\\1"
1624 ),
1625 "uri" => "http://www.dotnetdotcom.org"
1626 ),
1627 "doweb" => array(
1628 "icon" => "doweb",
1629 "title" => "DoWeb",
1630 "rule" => array(
1631 "^www.doweb.co.uk" => ""
1632 ),
1633 "uri" => "http://www.doweb.co.uk/"
1634 ),
1635 "downforeveryoneorjustme" => array(
1636 "icon" => "downforeveryoneorjustme",
1637 "title" => "Down for everyone or just me",
1638 "rule" => array(
1639 "downforeveryoneorjustme" => ""
1640 ),
1641 "uri" => "http://www.downforeveryoneorjustme.com"
1642 ),
1643 "downloadninja" => array(
1644 "icon" => "robot",
1645 "title" => "Download Ninja",
1646 "rule" => array(
1647 "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1648 ),
1649 "uri" => ""
1650 ),
1651 "drupal" => array(
1652 "icon" => "drupal",
1653 "title" => "Drupal",
1654 "rule" => array(
1655 "^Drupal" => ""
1656 ),
1657 "uri" => ""
1658 ),
1659 "dsns" => array(
1660 "icon" => "robot",
1661 "title" => "DSNS Scanner",
1662 "rule" => array(
1663 "^DSNS" => ""
1664 ),
1665 "uri" => ""
1666 ),
1667 "dtsagent" => array(
1668 "icon" => "robot",
1669 "title" => "DTS Agent",
1670 "rule" => array(
1671 "DTS Agent" => ""
1672 ),
1673 "uri" => ""
1674 ),
1675 "duckduckgo" => array(
1676 "icon" => "duckduckgo",
1677 "title" => "DuckDuckGo",
1678 "rule" => array(
1679 "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1",
1680 "DuckDuckBot-Https[ /]([0-9.]{1,10})" => "\\1"
1681 ),
1682 "uri" => "http://duckduckgo.com"
1683 ),
1684 "earthcom" => array(
1685 "icon" => "earthcom",
1686 "title" => "Earthcom",
1687 "rule" => array(
1688 "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1689 ),
1690 "uri" => ""
1691 ),
1692 "ebay" => array(
1693 "icon" => "ebay",
1694 "title" => "eBay",
1695 "rule" => array(
1696 "eBay Relevance Ad Crawler" => ""
1697 ),
1698 "uri" => ""
1699 ),
1700 "echo" => array(
1701 "icon" => "robot",
1702 "title" => "Echo.com",
1703 "rule" => array(
1704 "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1705 ),
1706 "uri" => "http://www.echo.com/"
1707 ),
1708 "eert" => array(
1709 "icon" => "robot",
1710 "title" => "Eert",
1711 "rule" => array(
1712 "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1713 ),
1714 "uri" => "http://bot.eert.net"
1715 ),
1716 "eknip" => array(
1717 "icon" => "eknip",
1718 "title" => "E-Knip",
1719 "rule" => array(
1720 "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1721 ),
1722 "uri" => ""
1723 ),
1724 "zoominfo" => array(
1725 "icon" => "zoominfo",
1726 "title" => "ZoomInfo", // Previously called Eliyon
1727 "rule" => array(
1728 "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1729 ),
1730 "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1731 ),
1732 "emeraldshield" => array(
1733 "icon" => "emeraldshield",
1734 "title" => "EmeraldShield",
1735 "rule" => array(
1736 "^EmeraldShield" => ""
1737 ),
1738 "uri" => ""
1739 ),
1740 "empas" => array(
1741 "icon" => "empas",
1742 "title" => "Empas",
1743 "rule" => array(
1744 "DigExt; empas\)$" => "",
1745 "^EMPAS[_\-]ROBOT" => ""
1746 ),
1747 "uri" => ""
1748 ),
1749 "entfer" => array(
1750 "icon" => "entfer",
1751 "title" => "Entfer",
1752 "rule" => array(
1753 "EntferBot[ /]([0-9.]{1,10})" => "\\1"
1754 ),
1755 "uri" => "https://entfer.com"
1756 ),
1757 "entireweb" => array(
1758 "icon" => "entireweb",
1759 "title" => "Entireweb",
1760 "rule" => array(
1761 "Speedy[ ]?Spider" => ""
1762 ),
1763 "uri" => ""
1764 ),
1765 "envolk" => array(
1766 "icon" => "envolk",
1767 "title" => "Envolk",
1768 "rule" => array(
1769 "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1770 "envolk[/ ]([0-9.]{1,10})" => "\\1"
1771 ),
1772 "uri" => ""
1773 ),
1774 "esnet" => array(
1775 "icon" => "robot",
1776 "title" => "ES.NET",
1777 "rule" => array(
1778 "ES.NET Crawler[ /]([0-9.]{1,10})" => "\\1"
1779 ),
1780 "uri" => ""
1781 ),
1782 "estyle" => array(
1783 "icon" => "estyle",
1784 "title" => "eStyle Search",
1785 "rule" => array(
1786 "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1787 ),
1788 "uri" => ""
1789 ),
1790 "eurip" => array(
1791 "icon" => "robot",
1792 "title" => "Eurip",
1793 "rule" => array(
1794 "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1795 ),
1796 "uri" => "http://www.eurip.com"
1797 ),
1798 "eurodirectory" => array(
1799 "icon" => "robot",
1800 "title" => "Euro Directory",
1801 "rule" => array(
1802 "www\.euro-directory\.com" => ""
1803 ),
1804 "uri" => "http://www.euro-directory.com/"
1805 ),
1806 "euroseek" => array(
1807 "icon" => "euroseek",
1808 "title" => "EuroSeek",
1809 "rule" => array(
1810 "Arachnoidea" => ""
1811 ),
1812 "uri" => ""
1813 ),
1814 "evaal" => array(
1815 "icon" => "evaal",
1816 "title" => "Evaal",
1817 "rule" => array(
1818 "^EvaalSE" => ""
1819 ),
1820 "uri" => "http://www.evaal.com/"
1821 ),
1822 "eventax" => array(
1823 "icon" => "eventax",
1824 "title" => "Eventax",
1825 "rule" => array(
1826 "^eventax[ /]([0-9.]{1,10})" => "\\1"
1827 ),
1828 "uri" => "http://www.eventax.de/"
1829 ),
1830 "everbee" => array(
1831 "icon" => "everbee",
1832 "title" => "Everbee",
1833 "rule" => array(
1834 "EverbeeCrawler" => ""
1835 ),
1836 "uri" => ""
1837 ),
1838 "everest" => array(
1839 "icon" => "everest",
1840 "title" => "Everest",
1841 "rule" => array(
1842 "Everest-Vulcan Inc.[ /]([0-9.]{1,10})" => "\\1"
1843 ),
1844 "uri" => ""
1845 ),
1846 "exabot" => array(
1847 "icon" => "exabot",
1848 "title" => "ExaBot",
1849 "rule" => array(
1850 "^NG[ /]([0-9.]{1,10})" => "\\1",
1851 "Exabot/([0-9.]{1,10})" => "\\1",
1852 "ExaBotTest/([0-9.]{1,10})" => "\\1",
1853 "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1854 "ExaBot-Thumbnails" => ""
1855 ),
1856 "uri" => "http://www.exabot.com/go/robot"
1857 ),
1858 "exactseek" => array(
1859 "icon" => "exactseek",
1860 "title" => "ExactSeek",
1861 "rule" => array(
1862 "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1863 "ExactSeek[ \.\-]?(Crawler|com)" => ""
1864 ),
1865 "uri" => "http://www.exactseek.com/"
1866 ),
1867 "excite" => array(
1868 "icon" => "excite",
1869 "title" => "Excite",
1870 "rule" => array(
1871 "Architext[ \-]?Spider" => ""
1872 ),
1873 "uri" => ""
1874 ),
1875 "execrawl" => array(
1876 "icon" => "robot",
1877 "title" => "Execrawl",
1878 "rule" => array(
1879 "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1880 "Execrawl" => ""
1881 ),
1882 "uri" => ""
1883 ),
1884 "expertmonitor" => array(
1885 "icon" => "robot",
1886 "title" => "ExpertMonitor",
1887 "rule" => array(
1888 "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1889 ),
1890 "uri" => ""
1891 ),
1892 "explorerrss" => array(
1893 "icon" => "robot",
1894 "title" => "Explorer RSS",
1895 "rule" => array(
1896 "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1897 ),
1898 "uri" => ""
1899 ),
1900 "ezooms" => array(
1901 "icon" => "robot",
1902 "title" => "Ezooms",
1903 "rule" => array(
1904 "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1905 ),
1906 "uri" => ""
1907 ),
1908 "facebook" => array(
1909 "icon" => "facebook",
1910 "title" => "Facebook",
1911 "rule" => array(
1912 "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1913 "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1914 "^facebook" => ""
1915 ),
1916 "uri" => "http://www.facebook.com/"
1917 ),
1918 "fast" => array(
1919 "icon" => "fast",
1920 "title" => "Fast",
1921 "rule" => array(
1922 "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1923 "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1924 "^Fast Crawler" => "",
1925 "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1926 ),
1927 "uri" => "http://www.alltheweb.com/"
1928 ),
1929 "fastbuzz" => array(
1930 "icon" => "fastbuzz",
1931 "title" => "Fastbuzz",
1932 "rule" => array(
1933 "^fastbuzz\.com" => ""
1934 ),
1935 "uri" => ""
1936 ),
1937 "favorg" => array(
1938 "icon" => "robot",
1939 "title" => "FavOrg",
1940 "rule" => array(
1941 "^FavOrg" => ""
1942 ),
1943 "uri" => ""
1944 ),
1945 "favorstar" => array(
1946 "icon" => "favorstar",
1947 "title" => "Favorstar",
1948 "rule" => array(
1949 "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1950 ),
1951 "uri" => "http://favorstar.com/bot.html"
1952 ),
1953 "faxo" => array(
1954 "icon" => "robot",
1955 "title" => "Faxo",
1956 "rule" => array(
1957 "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1958 ),
1959 "uri" => "http://www.faxo.com/"
1960 ),
1961 "fdse" => array(
1962 "icon" => "robot",
1963 "title" => "FDSE Robot",
1964 "rule" => array(
1965 "FDSE[ \-]?robot" => ""
1966 ),
1967 "uri" => ""
1968 ),
1969 "feedback" => array(
1970 "icon" => "robot",
1971 "title" => "FeedBack",
1972 "rule" => array(
1973 "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1974 ),
1975 "uri" => ""
1976 ),
1977 "feedburner" => array(
1978 "icon" => "feedburner",
1979 "title" => "FeedBurner",
1980 "rule" => array(
1981 "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1982 ),
1983 "uri" => ""
1984 ),
1985 "feeddemon" => array(
1986 "icon" => "feeddemon",
1987 "title" => "FeedDemon",
1988 "rule" => array(
1989 "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1990 ),
1991 "uri" => ""
1992 ),
1993 "feedfind" => array(
1994 "icon" => "feedfind",
1995 "title" => "FeedFind",
1996 "rule" => array(
1997 "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1998 ),
1999 "uri" => ""
2000 ),
2001 "feedonfeeds" => array(
2002 "icon" => "robot",
2003 "title" => "Feed On Feeds",
2004 "rule" => array(
2005 "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
2006 ),
2007 "uri" => ""
2008 ),
2009 "feedparser" => array(
2010 "icon" => "robot",
2011 "title" => "Feedparser",
2012 "rule" => array(
2013 "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
2014 "FeedParser" => ""
2015 ),
2016 "uri" => ""
2017 ),
2018 "feedreader" => array(
2019 "icon" => "feedreader",
2020 "title" => "Feedreader",
2021 "rule" => array(
2022 "^Feedreader" => ""
2023 ),
2024 "uri" => ""
2025 ),
2026 "feedserver" => array(
2027 "icon" => "robot",
2028 "title" => "FeedServer",
2029 "rule" => array(
2030 "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
2031 ),
2032 "uri" => ""
2033 ),
2034 "feedster" => array(
2035 "icon" => "feedster",
2036 "title" => "Feedster",
2037 "rule" => array(
2038 "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2039 ),
2040 "uri" => ""
2041 ),
2042 "feedvalidator" => array(
2043 "icon" => "feedvalidator",
2044 "title" => "Feed Validator",
2045 "rule" => array(
2046 "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2047 ),
2048 "uri" => ""
2049 ),
2050 "fdm" => array(
2051 "icon" => "robot",
2052 "title" => "Free Download Manager",
2053 "rule" => array(
2054 "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2055 ),
2056 "uri" => ""
2057 ),
2058 "filangy" => array(
2059 "icon" => "robot",
2060 "title" => "Filangy",
2061 "rule" => array(
2062 "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2063 ),
2064 "uri" => "http://www.filangy.com/"
2065 ),
2066 "findanisp" => array(
2067 "icon" => "robot",
2068 "title" => "FindAnISP",
2069 "rule" => array(
2070 "FindAnISP" => ""
2071 ),
2072 "uri" => "http://www.findanisp.com/"
2073 ),
2074 "findengines" => array(
2075 "icon" => "findengines",
2076 "title" => "FindEngines",
2077 "rule" => array(
2078 "FindEngines! Bot" => ""
2079 ),
2080 "uri" => ""
2081 ),
2082 "findexa" => array(
2083 "icon" => "findexa",
2084 "title" => "Findexa",
2085 "rule" => array(
2086 "Findexa Crawler" => ""
2087 ),
2088 "uri" => ""
2089 ),
2090 "findlinks" => array(
2091 "icon" => "findlinks",
2092 "title" => "FindLinks",
2093 "rule" => array(
2094 "findlinks[ /]([0-9.]{1,10})" => "\\1",
2095 "^FindLinks" => ""
2096 ),
2097 "uri" => ""
2098 ),
2099 "findoor" => array(
2100 "icon" => "findoor",
2101 "title" => "Findoor",
2102 "rule" => array(
2103 "^findoor(-Bot)?" => "" // group 1 is only the optional "-Bot" suffix, not a version, so no note is emitted
2104 ),
2105 "uri" => ""
2106 ),
2107 "firefly" => array(
2108 "icon" => "firefly",
2109 "title" => "Firefly",
2110 "rule" => array(
2111 "Firefly" => ""
2112 ),
2113 "uri" => ""
2114 ),
2115 "flashget" => array(
2116 "icon" => "flashget",
2117 "title" => "FlashGet",
2118 "rule" => array(
2119 "^FlashGet" => ""
2120 ),
2121 "uri" => ""
2122 ),
2123 "flatland" => array(
2124 "icon" => "flatland",
2125 "title" => "Flatland",
2126 "rule" => array(
2127 "^flatlandbot" => ""
2128 ),
2129 "uri" => "http://www.flatlandindustries.com/flatlandbot"
2130 ),
2131 "flickbot" => array(
2132 "icon" => "flickbot",
2133 "title" => "FlickBot",
2134 "rule" => array(
2135 "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2136 ),
2137 "uri" => ""
2138 ),
2139 "flightdeckreports" => array(
2140 "icon" => "flightdeckreports",
2141 "title" => "Flight Deck Reports",
2142 "rule" => array(
2143 "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2144 ),
2145 "uri" => "http://www.flightdeckreports.com/"
2146 ),
2147 "forex" => array(
2148 "icon" => "robot",
2149 "title" => "Forex",
2150 "rule" => array(
2151 "^Forex Trading Network Organization" => ""
2152 ),
2153 "uri" => "http://www.netforex.org/"
2154 ),
2155 "freshmeat" => array(
2156 "icon" => "freshmeat",
2157 "title" => "Freshmeat",
2158 "rule" => array(
2159 "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2160 "freshmeat.net URL validator[ /]([0-9.]{1,10})" => "\\1"
2161 ),
2162 "uri" => "http://www.freshmeat.net/"
2163 ),
2164 "friend" => array(
2165 "icon" => "friend",
2166 "title" => "Friend",
2167 "rule" => array(
2168 "www\.friend\.fr" => ""
2169 ),
2170 "uri" => "http://www.friend.fr/"
2171 ),
2172 "frontier" => array(
2173 "icon" => "frontier",
2174 "title" => "Frontier",
2175 "rule" => array(
2176 "Frontier[ /]([0-9.]{1,10})" => "\\1"
2177 ),
2178 "uri" => ""
2179 ),
2180 "fyberspider" => array(
2181 "icon" => "robot",
2182 "title" => "FyberSpider",
2183 "rule" => array(
2184 "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2185 ),
2186 "uri" => "http://www.fyberspider.com/"
2187 ),
2188 "gaisbot" => array(
2189 "icon" => "gais",
2190 "title" => "Gaisbot",
2191 "rule" => array(
2192 "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2193 ),
2194 "uri" => ""
2195 ),
2196 "galaxy" => array(
2197 "icon" => "galaxy",
2198 "title" => "Galaxy",
2199 "rule" => array(
2200 "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2201 "www.galaxy.com" => ""
2202 ),
2203 "uri" => "http://www.galaxy.com/"
2204 ),
2205 "gamespy" => array(
2206 "icon" => "gamespy",
2207 "title" => "GameSpy",
2208 "rule" => array(
2209 "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2210 ),
2211 "uri" => ""
2212 ),
2213 "garlik" => array(
2214 "icon" => "garlik",
2215 "title" => "Garlik",
2216 "rule" => array(
2217 "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2218 ),
2219 "uri" => "http://garlik.com/"
2220 ),
2221 "gdesktop" => array(
2222 "icon" => "gdesktop",
2223 "title" => "Google Desktop",
2224 "rule" => array(
2225 "compatible; Google Desktop" => ""
2226 ),
2227 "uri" => ""
2228 ),
2229 "genome" => array(
2230 "icon" => "robot",
2231 "title" => "Genome Machine",
2232 "rule" => array(
2233 "Genome[ \-]?Machine" => ""
2234 ),
2235 "uri" => ""
2236 ),
2237 "geohash" => array(
2238 "icon" => "geohash",
2239 "title" => "Geohash",
2240 "rule" => array(
2241 "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2242 ),
2243 "uri" => "http://geohash.org/"
2244 ),
2245 "geona" => array(
2246 "icon" => "robot",
2247 "title" => "Geona",
2248 "rule" => array(
2249 "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2250 ),
2251 "uri" => ""
2252 ),
2253 "geoblog" => array(
2254 "icon" => "robot",
2255 "title" => "The World as a Blog",
2256 "rule" => array(
2257 "The World as a Blog" => ""
2258 ),
2259 "uri" => ""
2260 ),
2261 "geourl" => array(
2262 "icon" => "geourl",
2263 "title" => "GeoUrl",
2264 "rule" => array(
2265 "geourl[ /]([0-9.]{1,10})" => "\\1",
2266 "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2267 ),
2268 "uri" => ""
2269 ),
2270 "getnetwise" => array(
2271 "icon" => "robot",
2272 "title" => "GetNetWise",
2273 "rule" => array(
2274 " Crayon Crawler" => ""
2275 ),
2276 "uri" => ""
2277 ),
2278 "getright" => array(
2279 "icon" => "getright",
2280 "title" => "GetRight",
2281 "rule" => array(
2282 "GetRight[ /]([0-9.]{1,10})" => "\\1"
2283 ),
2284 "uri" => ""
2285 ),
2286 "getsmart" => array(
2287 "icon" => "getsmart",
2288 "title" => "GetSmart",
2289 "rule" => array(
2290 "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2291 ),
2292 "uri" => ""
2293 ),
2294 "gigabot" => array(
2295 "icon" => "gigablast",
2296 "title" => "Gigablast",
2297 "rule" => array(
2298 "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2299 "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2300 "GigablastOpenSource" => ""
2301 ),
2302 "uri" => ""
2303 ),
2304 "gimme" => array(
2305 "icon" => "gimme",
2306 "title" => "gimmeUSA",
2307 "rule" => array(
2308 "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2309 ),
2310 "uri" => "http://gimme60.com"
2311 ),
2312 "ginger" => array(
2313 "icon" => "ginger",
2314 "title" => "GingerCrawler",
2315 "rule" => array(
2316 "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2317 ),
2318 "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2319 ),
2320 "girafabot" => array(
2321 "icon" => "girafa",
2322 "title" => "Girafa",
2323 "rule" => array(
2324 "Girafabot" => ""
2325 ),
2326 "uri" => ""
2327 ),
2328 "globalspec" => array(
2329 "icon" => "globalspec",
2330 "title" => "GlobalSpec",
2331 "rule" => array(
2332 "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2333 ),
2334 "uri" => ""
2335 ),
2336 "glucose" => array(
2337 "icon" => "glucose",
2338 "title" => "Glucose",
2339 "rule" => array(
2340 "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2341 ),
2342 "uri" => ""
2343 ),
2344 "gnomit" => array(
2345 "icon" => "gnomit",
2346 "title" => "Gnomit",
2347 "rule" => array(
2348 "gnomit[ /]([0-9.]{1,10})" => "\\1"
2349 ),
2350 "uri" => "http://www.gnomit.com/",
2351 ),
2352 "goforit" => array(
2353 "icon" => "goforit",
2354 "title" => "GoForIt",
2355 "rule" => array(
2356 "^GoForIt\.com" => "",
2357 "^GOFORITBOT" => ""
2358 ),
2359 "uri" => ""
2360 ),
2361 "goguides" => array(
2362 "icon" => "robot",
2363 "title" => "GoGuides",
2364 "rule" => array(
2365 "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2366 ),
2367 "uri" => "http://www.goguides.org/"
2368 ),
2369 // Needs to be before google for correct detection
2370 "mediapartners" => array(
2371 "icon" => "google",
2372 "title" => "Mediapartners",
2373 "rule" => array (
2374 "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2375 "Mediapartners-Google" => ""
2376 ),
2377 "uri" => ""
2378 ),
2379 "google" => array(
2380 "icon" => "google",
2381 "title" => "Google",
2382 "rule" => array (
2383 "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2384 "Googl(e|ebot)(-Image)?/" => "",
2385 "^gsa-crawler" => "",
2386 "Google Web Preview" => ""
2387 ),
2388 "uri" => "http://www.google.com/"
2389 ),
2390 "googlesitemaps" => array(
2391 "icon" => "google",
2392 "title" => "Google-Sitemaps",
2393 "rule" => array (
2394 "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2395 "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2396 "Googl(e|ebot)(-Sitemaps)?/" => ""
2397 ),
2398 "uri" => ""
2399 ),
2400 "googlemobile" => array(
2401 "icon" => "google",
2402 "title" => "Google-Mobile",
2403 "rule" => array (
2404 "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2405 "Googl(e|ebot)(-Mobile)?/" => ""
2406 ),
2407 "uri" => ""
2408 ),
2409 "googleads" => array(
2410 "icon" => "google",
2411 "title" => "Google-AdsBot",
2412 "rule" => array (
2413 "^AdsBot-Google" => "",
2414 ),
2415 "uri" => ""
2416 ),
2417 "googlefeeds" => array(
2418 "icon" => "google",
2419 "title" => "Google-Feedfetcher",
2420 "rule" => array (
2421 "^Feedfetcher-Google" => "",
2422 ),
2423 "uri" => ""
2424 ),
2425 "googlverification" => array(
2426 "icon" => "google",
2427 "title" => "Google-Site-Verification",
2428 "rule" => array (
2429 "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2430 ),
2431 "uri" => ""
2432 ),
2433 // Needs to be AFTER Google detection
2434 "goo" => array(
2435 "icon" => "goo",
2436 "title" => "Goo",
2437 "rule" => array (
2438 "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2439 "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2440 ),
2441 "uri" => ""
2442 ),
2443 "goongee" => array(
2444 "icon" => "robot",
2445 "title" => "GoonGee",
2446 "rule" => array (
2447 "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // the pattern has a single capture group (the version digits)
2448 ),
2449 "uri" => "http://www.goongee.com/"
2450 ),
2451 "gpost" => array(
2452 "icon" => "gpost",
2453 "title" => "GPost",
2454 "rule" => array(
2455 "^GPostbot" => ""
2456 ),
2457 "uri" => ""
2458 ),
2459 "grapeshot" => array(
2460 "icon" => "grapeshot",
2461 "title" => "Grapeshot",
2462 "rule" => array(
2463 "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2464 ),
2465 "uri" => "http://www.grapeshot.co.uk/crawler.php"
2466 ),
2467 "gregarius" => array(
2468 "icon" => "robot",
2469 "title" => "Gregarius",
2470 "rule" => array(
2471 "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // report the captured version, like the other versioned rules
2472 ),
2473 "uri" => ""
2474 ),
2475 "grub" => array(
2476 "icon" => "grub",
2477 "title" => "Grub",
2478 "rule" => array(
2479 "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2480 "grub crawler" => "",
2481 "grub[/ ]([0-9.]{1,10})" => "\\1",
2482 "^GrubNG([0-9. ]{1,10})?" => "\\1"
2483 ),
2484 "uri" => "http://www.grub.org/"
2485 ),
2486 "gulliver" => array(
2487 "icon" => "robot",
2488 "title" => "Gulliver",
2489 "rule" => array(
2490 "Gulliver" => ""
2491 ),
2492 "uri" => ""
2493 ),
2494 "guruji" => array(
2495 "icon" => "guruji",
2496 "title" => "Guruji",
2497 "rule" => array(
2498 "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2499 ),
2500 "uri" => "http://www.guruji.com/"
2501 ),
2502 "gush" => array(
2503 "icon" => "robot",
2504 "title" => "Gush",
2505 "rule" => array(
2506 "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2507 ),
2508 "uri" => ""
2509 ),
2510 "gziptester" => array(
2511 "icon" => "robot",
2512 "title" => "Gzip Tester",
2513 "rule" => array(
2514 "HTTP_Compression_Test" => "",
2515 "g(id)?zip[ \-]?test(er)?" => ""
2516 ),
2517 "uri" => "http://whatsmyip.org/"
2518 ),
2519 "hanzoweb" => array(
2520 "icon" => "hanzoweb",
2521 "title" => "Hanzoweb",
2522 "rule" => array(
2523 "^Hanzoweb" => ""
2524 ),
2525 "uri" => ""
2526 ),
2527 "harbot" => array(
2528 "icon" => "harbot",
2529 "title" => "Harbot",
2530 "rule" => array(
2531 "^Harbot GateStation" => ""
2532 ),
2533 "uri" => ""
2534 ),
2535 "hatena" => array(
2536 "icon" => "hatena",
2537 "title" => "Hatena",
2538 "rule" => array(
2539 "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2540 ),
2541 "uri" => ""
2542 ),
2543 "htmlparser" => array(
2544 "icon" => "htmlparser",
2545 "title" => "HTMLParser",
2546 "rule" => array(
2547 "HTMLParser[ /]([0-9.]{1,10})" => "\\1",
2548 "lua-resty-http/0.10" => ""
2549 ),
2550 "uri" => "http://htmlparser.sourceforge.net/"
2551 ),
2552 "helix" => array(
2553 "icon" => "helix",
2554 "title" => "Helix", // display name for the sitesearch.ca Helix crawler; "Heritrix" has its own entry
2555 "rule" => array(
2556 "^helix[ /]([0-9.]{1,10})" => "\\1"
2557 ),
2558 "uri" => "http://www.sitesearch.ca/helix/"
2559 ),
2560 "heritrix" => array(
2561 "icon" => "heritrix",
2562 "title" => "Heritrix",
2563 "rule" => array(
2564 "heritrix[ /]([0-9.]{1,10})" => "\\1",
2565 "archive.org_bot" => "",
2566 "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2567 ),
2568 "uri" => "http://archive.org"
2569 ),
2570 "hiddenmarket" => array(
2571 "icon" => "robot",
2572 "title" => "HiddenMarket",
2573 "rule" => array(
2574 "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2575 ),
2576 "uri" => ""
2577 ),
2578 "honda" => array(
2579 "icon" => "robot",
2580 "title" => "Honda",
2581 "rule" => array(
2582 "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2583 ),
2584 "uri" => "http://www.honda-search.com"
2585 ),
2586 "hoowwwer" => array(
2587 "icon" => "hoowwwer",
2588 "title" => "HooWWWer",
2589 "rule" => array(
2590 "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2591 ),
2592 "uri" => ""
2593 ),
2594 "hotzonu" => array(
2595 "icon" => "hotzonu",
2596 "title" => "Hotzonu",
2597 "rule" => array(
2598 "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2599 ),
2600 "uri" => ""
2601 ),
2602 "houxou" => array(
2603 "icon" => "robot",
2604 "title" => "Houxou",
2605 "rule" => array(
2606 "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2607 "HouxouCrawler" => ""
2608 ),
2609 "uri" => ""
2610 ),
2611 "htdig" => array(
2612 "icon" => "htdig",
2613 "title" => "ht://Dig",
2614 "rule" => array(
2615 "htdig[ /]([0-9.]{1,10})" => "\\1",
2616 "htdig" => "" // fallback for agents without a version: no capture group, so no note
2617 ),
2618 "uri" => ""
2619 ),
2620 "html2jpg" => array(
2621 "icon" => "html2jpg",
2622 "title" => "HTML2JPG",
2623 "rule" => array(
2624 "^HTML2JPG" => ""
2625 ),
2626 "uri" => ""
2627 ),
2628 "httperf" => array(
2629 "icon" => "robot",
2630 "title" => "HTTPerf",
2631 "rule" => array(
2632 "httperf[ /]([0-9.]{1,10})" => "\\1"
2633 ),
2634 "uri" => ""
2635 ),
2636 "httpunit" => array(
2637 "icon" => "httpunit",
2638 "title" => "HttpUnit",
2639 "rule" => array(
2640 "httpunit[ /]([0-9.]{1,10})" => "\\1"
2641 ),
2642 "uri" => ""
2643 ),
2644 "httrack" => array(
2645 "icon" => "httrack",
2646 "title" => "HTTrack",
2647 "rule" => array(
2648 "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2649 ),
2650 "uri" => ""
2651 ),
2652 "huaweisymantec" => array(
2653 "icon" => "huaweisymantec",
2654 "title" => "HuaweiSymantec",
2655 "rule" => array(
2656 "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2657 ),
2658 "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2659 ),
2660 "hungary" => array(
2661 "icon" => "hungary",
2662 "title" => "Hungary",
2663 "rule" => array(
2664 "HuRob[ /]([0-9.]{1,10})" => "\\1"
2665 ),
2666 "uri" => ""
2667 ),
2668 "i18n" => array(
2669 "icon" => "w3c",
2670 "title" => "W3C I18n Checker",
2671 "rule" => array(
2672 "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2673 ),
2674 "uri" => "http://validator.w3.org/services"
2675 ),
2676 "iakke" => array(
2677 "icon" => "iakke",
2678 "title" => "Iakké",
2679 "rule" => array(
2680 "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2681 ),
2682 "uri" => "http://fr.iakke.com/"
2683 ),
2684 "iask" => array(
2685 "icon" => "iask",
2686 "title" => "IAsk",
2687 "rule" => array(
2688 "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2689 "^iaskspider" => ""
2690 ),
2691 "uri" => "http://iask.com"
2692 ),
2693 "icc" => array(
2694 "icon" => "icc",
2695 "title" => "ICC-Crawler",
2696 "rule" => array(
2697 "^ICC-Crawler" => ""
2698 ),
2699 "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2700 ),
2701 "icerocket" => array(
2702 "icon" => "icerocket",
2703 "title" => "Icerocket",
2704 "rule" => array(
2705 "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2706 "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2707 ),
2708 "uri" => ""
2709 ),
2710 "icjobs" => array(
2711 "icon" => "icjobs",
2712 "title" => "iCjobs",
2713 "rule" => array(
2714 "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2715 ),
2716 "uri" => "http://www.icjobs.de/"
2717 ),
2718 "icra" => array(
2719 "icon" => "icra",
2720 "title" => "ICRA",
2721 "rule" => array(
2722 "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2723 ),
2724 "uri" => "http://www.icra.org"
2725 ),
2726 "iknow" => array(
2727 "icon" => "robot",
2728 "title" => "I know",
2729 "rule" => array(
2730 "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2731 ),
2732 "uri" => ""
2733 ),
2734 "ilial" => array(
2735 "icon" => "robot",
2736 "title" => "Ilial",
2737 "rule" => array(
2738 "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2739 ),
2740 "uri" => ""
2741 ),
2742 "ilocal" => array(
2743 "icon" => "ilocal",
2744 "title" => "ilocal",
2745 "rule" => array(
2746 "^ilocal" => "",
2747 ),
2748 "uri" => "http://www.ilocal.nl"
2749 ),
2750 "ilse" => array(
2751 "icon" => "ilse",
2752 "title" => "Ilse",
2753 "rule" => array(
2754 "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot-name alternation; the version is group 2
2755 ),
2756 "uri" => "http://ilse.nl/"
2757 ),
2758 "iltrovatore" => array(
2759 "icon" => "iltrovatore",
2760 "title" => "IlTrovatore",
2761 "rule" => array(
2762 "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2763 "Iltrovatore-Setaccio" => "",
2764 "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2765 ),
2766 "uri" => ""
2767 ),
2768 "indylibrary" => array(
2769 "icon" => "robot",
2770 "title" => "Indy Library",
2771 "rule" => array(
2772 "Indy[ \-]?Library" => ""
2773 ),
2774 "uri" => ""
2775 ),
2776 "inela" => array(
2777 "icon" => "robot",
2778 "title" => "Inela",
2779 "rule" => array(
2780 "InelaBot[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
2781 ),
2782 "uri" => "http://inelegant.org/bot"
2783 ),
2784 "ineturl" => array(
2785 "icon" => "robot",
2786 "title" => "InetURL",
2787 "rule" => array(
2788 "InetURL.?[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
2789 ),
2790 "uri" => ""
2791 ),
2792 "infoart" => array(
2793 "icon" => "robot",
2794 "title" => "InfoArt",
2795 "rule" => array(
2796 "InfoArt crawler" => ""
2797 ),
2798 "uri" => ""
2799 ),
2800 "infomine" => array(
2801 "icon" => "infomine",
2802 "title" => "INFOMINE",
2803 "rule" => array(
2804 "^DataFountains/DMOZ" => "",
2805 "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2806 ),
2807 "uri" => "http://infomine.ucr.edu/"
2808 ),
2809 "infoseek" => array(
2810 "icon" => "infoseek",
2811 "title" => "Infoseek",
2812 "rule" => array(
2813 "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2814 "Infoseek" => ""
2815 ),
2816 "uri" => ""
2817 ),
2818 "inktomi" => array(
2819 "icon" => "inktomi",
2820 "title" => "Inktomi",
2821 "rule" => array(
2822 "slurp@inktomi\.com" => ""
2823 ),
2824 "uri" => ""
2825 ),
2826 "innerprise" => array(
2827 "icon" => "robot",
2828 "title" => "Innerprise",
2829 "rule" => array(
2830 "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2831 "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2832 "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2833 ),
2834 "uri" => "http://www.innerprise.com/"
2835 ),
2836 "inria" => array(
2837 "icon" => "inria",
2838 "title" => "Inria",
2839 "rule" => array(
2840 "^xyro_" => ""
2841 ),
2842 "uri" => ""
2843 ),
2844 "insitor" => array(
2845 "icon" => "insitor",
2846 "title" => "Insitor",
2847 "rule" => array(
2848 "^Insitor(,|\.|naut)" => ""
2849 ),
2850 "uri" => "http://www.insitor.com/"
2851 ),
2852 "internetninja" => array(
2853 "icon" => "robot",
2854 "title" => "Internet Ninja",
2855 "rule" => array(
2856 "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2857 ),
2858 "uri" => ""
2859 ),
2860 "internetseer" => array(
2861 "icon" => "internetseer",
2862 "title" => "InternetSeer",
2863 "rule" => array(
2864 "^InternetSeer\.com" => ""
2865 ),
2866 "uri" => ""
2867 ),
2868 "interseek" => array(
2869 "icon" => "interseek",
2870 "title" => "Interseek",
2871 "rule" => array(
2872 "Interseek.com" => ""
2873 ),
2874 "uri" => "http://www.interseek.com"
2875 ),
2876 "intravnews" => array(
2877 "icon" => "intravnews",
2878 "title" => "IntraVnews",
2879 "rule" => array(
2880 "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2881 ),
2882 "uri" => "http://www.intravnews.com/"
2883 ),
2884 "ionos" => array(
2885 "icon" => "ionos",
2886 "title" => "IONOS",
2887 "rule" => array(
2888 "IonCrawl" => ""
2889 ),
2890 "uri" => "https://www.ionos.de/terms-gtc/faq-crawler-en/"
2891 ),
2892 "ip2location" => array(
2893 "icon" => "ip2location",
2894 "title" => "IP2LocationBot",
2895 "rule" => array(
2896 "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2897 ),
2898 "uri" => "http://www.ip2location.com"
2899 ),
2900 "ipworks" => array(
2901 "icon" => "ipworks",
2902 "title" => "IP*Works",
2903 "rule" => array(
2904 "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2905 ),
2906 "uri" => "http://www.nsoftware.com/ipworks/"
2907 ),
2908 "irca" => array(
2909 "icon" => "robot",
2910 "title" => "Novell iChain Cool Solutions caching",
2911 "rule" => array(
2912 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2913 "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2914 ),
2915 "uri" => "http://www.icra.org"
2916 ),
2917 "irvine" => array(
2918 "icon" => "robot",
2919 "title" => "Irvine",
2920 "rule" => array(
2921 "Irvine[ /]([0-9.]{1,10})" => "\\1"
2922 ),
2923 "uri" => ""
2924 ),
2925 "ips-agent" => array(
2926 "icon" => "robot",
2927 "title" => "IPS-agent",
2928 "rule" => array(
2929 "ips-agent" => ""
2930 ),
2931 "uri" => ""
2932 ),
2933 "isara" => array(
2934 "icon" => "isara",
2935 "title" => "Isara",
2936 "rule" => array(
2937 "Isara[ -]([0-9.]{1,10})" => "\\1"
2938 ),
2939 "uri" => "http://www.isara.org/"
2940 ),
2941 "isspider" => array(
2942 "icon" => "robot",
2943 "title" => "ISSpider",
2944 "rule" => array(
2945 "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2946 ),
2947 "uri" => ""
2948 ),
2949 "it2media" => array(
2950 "icon" => "it2media",
2951 "title" => "IT2media",
2952 "rule" => array(
2953 "www.adressendeutschland.de" => ""
2954 ),
2955 "uri" => "http://www.adressendeutschland.de/"
2956 ),
2957 "ivia" => array(
2958 "icon" => "robot",
2959 "title" => "iVia",
2960 "rule" => array(
2961 "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2962 ),
2963 "uri" => ""
2964 ),
2965 "jeteye" => array(
2966 "icon" => "jeteye",
2967 "title" => "Jeteye",
2968 "rule" => array(
2969 "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2970 ),
2971 "uri" => ""
2972 ),
2973 "jobsde" => array(
2974 "icon" => "jobsde",
2975 "title" => "jobs.de",
2976 "rule" => array(
2977 "www\.jobs\.de" => "",
2978 "jobs.de-Robot" => ""
2979 ),
2980 "uri" => "http://www.jobs.de/"
2981 ),
2982 "jpluck" => array(
2983 "icon" => "robot",
2984 "title" => "Jpluck",
2985 "rule" => array(
2986 "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2987 ),
2988 "uri" => ""
2989 ),
2990 "jxta" => array(
2991 "icon" => "robot",
2992 "title" => "Jxta",
2993 "rule" => array(
2994 "falcon[ /]([0-9.]{1,10})" => "\\1"
2995 ),
2996 "uri" => ""
2997 ),
2998 "jyte" => array(
2999 "icon" => "jyte",
3000 "title" => "Jyte",
3001 "rule" => array(
3002 "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
3003 ),
3004 "uri" => ""
3005 ),
3006 "jyxo" => array(
3007 "icon" => "jyxo",
3008 "title" => "Jyxo",
3009 "rule" => array(
3010 "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
3011 ),
3012 "uri" => ""
3013 ),
3014 "kalooga" => array(
3015 "icon" => "kalooga",
3016 "title" => "Kalooga",
3017 "rule" => array(
3018 "kalooga[ /-]([0-9.]{1,10})" => "\\1",
3019 "^kalooga" => "",
3020 "KaloogaBot" => ""
3021 ),
3022 "uri" => "http://www.kalooga.com"
3023 ),
3024 "keywen" => array(
3025 "icon" => "keywen",
3026 "title" => "Keywen",
3027 "rule" => array(
3028 "EasyDL[ /]([0-9.]{1,10})" => "\\1"
3029 ),
3030 "uri" => ""
3031 ),
3032 "kilomonkey" => array(
3033 "icon" => "robot",
3034 "title" => "Kilomonkey",
3035 "rule" => array(
3036 "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
3037 ),
3038 "uri" => "http://www.kilomonkey.com/notabot.txt"
3039 ),
3040 "kinja" => array(
3041 "icon" => "kinja",
3042 "title" => "Kinja",
3043 "rule" => array(
3044 "kinjabot[ /]([0-9.]{1,10})" => "\\1",
3045 "^kinjabot" => ""
3046 ),
3047 "uri" => ""
3048 ),
3049 "kiwi" => array(
3050 "icon" => "robot",
3051 "title" => "KiwiStatus",
3052 "rule" => array(
3053 "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3054 "KiwiStatus" => ""
3055 ),
3056 "uri" => "http://www.nzs.com/kiei-status/"
3057 ),
3058 "lachesis" => array(
3059 "icon" => "robot",
3060 "title" => "Lachesis",
3061 "rule" => array(
3062 "lachesis" => ""
3063 ),
3064 "uri" => ""
3065 ),
3066 "lanshan" => array(
3067 "icon" => "robot",
3068 "title" => "Lanshan", // was "Lachesis", duplicated from the preceding entry
3069 "rule" => array(
3070 "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
3071 ),
3072 "uri" => ""
3073 ),
3074 "lapozz" => array(
3075 "icon" => "lapozz",
3076 "title" => "Lapozz",
3077 "rule" => array(
3078 "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3079 ),
3080 "uri" => ""
3081 ),
3082 "larbin" => array(
3083 "icon" => "robot",
3084 "title" => "Larbin",
3085 "rule" => array(
3086 "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3087 ),
3088 "uri" => ""
3089 ),
3090 "laurion" => array(
3091 "icon" => "robot",
3092 "title" => "Laurion",
3093 "rule" => array(
3094 "^IPiumBot" => ""
3095 ),
3096 "uri" => "http://www.laurion.com/"
3097 ),
3098 "leechget" => array(
3099 "icon" => "leechget",
3100 "title" => "LeechGet",
3101 "rule" => array(
3102 "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3103 ),
3104 "uri" => ""
3105 ),
3106 "linguaseek" => array(
3107 "icon" => "linguaseek",
3108 "title" => "Linguaseek",
3109 "rule" => array(
3110 "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3111 ),
3112 "uri" => "http://www.linguaseek.com/"
3113 ),
3114 "linguee" => array(
3115 "icon" => "linguee",
3116 "title" => "Linguee",
3117 "rule" => array(
3118 "^Linguee Bot" => ""
3119 ),
3120 "uri" => "http://www.linguee.com/"
3121 ),
3122 "linkapedia" => array(
3123 "icon" => "linkapedia",
3124 "title" => "Linkapedia",
3125 "rule" => array(
3126 "^linkapedia" => ""
3127 ),
3128 "uri" => "http://www.linkapedia.com"
3129 ),
3130 "linkdex" => array(
3131 "icon" => "linkdex",
3132 "title" => "Linkdex",
3133 "rule" => array(
3134 "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3135 ),
3136 "uri" => "http://www.linkdex.com/bots/"
3137 ),
3138 "linkedin" => array(
3139 "icon" => "linkedin",
3140 "title" => "LinkedIn",
3141 "rule" => array(
3142 "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3143 ),
3144 "uri" => "http://www.linkedin.com"
3145 ),
3146 "linkguard" => array(
3147 "icon" => "robot",
3148 "title" => "Linkguard",
3149 "rule" => array(
3150 "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3151 ),
3152 "uri" => "http://www.linkguard.com/"
3153 ),
3154 "linklint" => array(
3155 "icon" => "linklint",
3156 "title" => "Linklint",
3157 "rule" => array(
3158 "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3159 ),
3160 "uri" => "http://www.linklint.org/"
3161 ),
3162 "linkman" => array(
3163 "icon" => "linkman",
3164 "title" => "Linkman",
3165 "rule" => array(
3166 "\(compatible; Linkman\)" => ""
3167 ),
3168 "uri" => ""
3169 ),
3170 // Needs to be before linkcheck for correct detection
3171 "linkchecker" => array(
3172 "icon" => "w3c",
3173 "title" => "W3C Link Checker",
3174 "rule" => array(
3175 "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3176 ),
3177 "uri" => "http://validator.w3.org/checklink"
3178 ),
3179 "linkcheck" => array(
3180 "icon" => "linkcheck",
3181 "title" => "Linkcheck",
3182 "rule" => array(
3183 "checklink[ /]([0-9.]{1,10})" => "\\1",
3184 "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3185 "Adaxas Spider" => "",
3186 "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3187 // "NetMechanic V([0-9.]{1,10})" => "\\1",
3188 "^InfoLink" => "",
3189 "InternetLinkAgent" => "",
3190 "; SPENG\)" => "",
3191 "SharewarePlazaFileCheckBot" => "",
3192 "fileboost.net" => "",
3193 "^billbot" => ""
3194 ),
3195 "uri" => ""
3196 ),
3197 "linkru" => array(
3198 "icon" => "robot",
3199 "title" => "Link.RU",
3200 "rule" => array(
3201 "^Link.RU bot" => ""
3202 ),
3203 "uri" => ""
3204 ),
3205 "linkssql" => array(
3206 "icon" => "robot",
3207 "title" => "Links SQL",
3208 "rule" => array(
3209 "links sql" => ""
3210 ),
3211 "uri" => ""
3212 ),
3213 "linksweeper" => array(
3214 "icon" => "robot",
3215 "title" => "Link Sweeper",
3216 "rule" => array(
3217 "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3218 ),
3219 "uri" => ""
3220 ),
3221 "linkwalker" => array(
3222 "icon" => "robot",
3223 "title" => "Link Walker",
3224 "rule" => array(
3225 "^LinkWalker" => ""
3226 ),
3227 "uri" => ""
3228 ),
3229 "lipperhey" => array(
3230 "icon" => "lipperhey",
3231 "title" => "Lipperhey",
3232 "rule" => array(
3233 "Lipperhey Spider" => ""
3234 ),
3235 "uri" => "http://www.lipperhey.com"
3236 ),
3237 "livedoor" => array(
3238 "icon" => "livedoor",
3239 "title" => "Livedoor",
3240 "rule" => array(
3241 "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3242 ),
3243 "uri" => ""
3244 ),
3245 "livejournal" => array(
3246 "icon" => "livejournal",
3247 "title" => "Live Journal",
3248 "rule" => array(
3249 "^LiveJournal\.com" => ""
3250 ),
3251 "uri" => "http://www.livejournal.com"
3252 ),
3253 "ljpic" => array(
3254 "icon" => "ljpic",
3255 "title" => "ljpic",
3256 "rule" => array(
3257 "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3258 ),
3259 "uri" => "http://www.ljpic.com"
3260 ),
3261 "lmspider" => array(
3262 "icon" => "robot",
3263 "title" => "Lmspider",
3264 "rule" => array(
3265 "^lmspider" => ""
3266 ),
3267 "uri" => ""
3268 ),
3269 "locators" => array(
3270 "icon" => "robot",
3271 "title" => "Locaters",
3272 "rule" => array(
3273 "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3274 ),
3275 "uri" => ""
3276 ),
3277 "look" => array(
3278 "icon" => "look",
3279 "title" => "Look",
3280 "rule" => array(
3281 "www\.look\.com" => "",
3282 "Lookbot" => ""
3283 ),
3284 "uri" => ""
3285 ),
3286 "looksmart" => array(
3287 "icon" => "looksmart",
3288 "title" => "LookSmart",
3289 "rule" => array(
3290 "^Martini" => "",
3291 "^MantraAgent" => "",
3292 "FurlBot" => "",
3293 "looksmart-sv-fw" => ""
3294 ),
3295 "uri" => ""
3296 ),
3297 "loop" => array(
3298 "icon" => "loop",
3299 "title" => "LOOP",
3300 "rule" => array(
3301 "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3302 ),
3303 "uri" => ""
3304 ),
3305 "lotkyll" => array(
3306 "icon" => "robot",
3307 "title" => "Lotkyll",
3308 "rule" => array(
3309 "Lotkyll" => ""
3310 ),
3311 "uri" => ""
3312 ),
3313 "ltx71" => array(
3314 "icon" => "robot",
3315 "title" => "LTX71",
3316 "rule" => array(
3317 "ltx71" => ""
3318 ),
3319 "uri" => "http://ltx71.com/"
3320 ),
3321 "lwp" => array(
3322 "icon" => "robot",
3323 "title" => "lwp",
3324 "rule" => array(
3325 "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3326 ),
3327 "uri" => ""
3328 ),
3329 "lycos" => array(
3330 "icon" => "lycos",
3331 "title" => "Lycos",
3332 "rule" => array(
3333 "Lycos_Spider_" => ""
3334 ),
3335 "uri" => ""
3336 ),
3337 "magpierss" => array(
3338 "icon" => "rss",
3339 "title" => "MagpieRSS",
3340 "rule" => array(
3341 "MagpieRSS" => ""
3342 ),
3343 "uri" => "http://magpierss.sourceforge.net/"
3344 ),
3345 "mailru" => array(
3346 "icon" => "mailru",
3347 "title" => "Mail.Ru",
3348 "rule" => array(
3349 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3350 "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3351 ),
3352 "uri" => "http://www.mail.ru/"
3353 ),
3354 "mailsweeper" => array(
3355 "icon" => "robot",
3356 "title" => "Mail Sweeper",
3357 "rule" => array(
3358 "Mail[ \-]?Sweeper" => ""
3359 ),
3360 "uri" => ""
3361 ),
3362 "marvin" => array(
3363 "icon" => "robot",
3364 "title" => "Marvin",
3365 "rule" => array(
3366 "^Marvin" => ""
3367 ),
3368 "uri" => ""
3369 ),
3370 "matkurja" => array(
3371 "icon" => "matkurja",
3372 "title" => "Mat'Kurja",
3373 "rule" => array(
3374 "Mosad[ /]([0-9.]{1,10})" => "\\1"
3375 ),
3376 "uri" => ""
3377 ),
3378 "mavicanet" => array(
3379 "icon" => "mavicanet",
3380 "title" => "Mavicanet",
3381 "rule" => array(
3382 "Mavicanet robot" => ""
3383 ),
3384 "uri" => ""
3385 ),
3386 "meanpath" => array(
3387 "icon" => "meanpath",
3388 "title" => "Meanpath",
3389 "rule" => array(
3390 "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3391 ),
3392 "uri" => "http://www.meanpath.com/meanpathbot.html"
3393 ),
3394 "mediater" => array(
3395 "icon" => "robot",
3396 "title" => "Mediater",
3397 "rule" => array (
3398 "^libwww[ /]([0-9.]{1,10})" => "\\1"
3399 ),
3400 "uri" => ""
3401 ),
3402 "memory" => array(
3403 "icon" => "memory",
3404 "title" => "internet Memory",
3405 "rule" => array (
3406 "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3407 ),
3408 "uri" => "http://internetmemory.org/en/"
3409 ),
3410 "mercator" => array(
3411 "icon" => "robot",
3412 "title" => "Mercator",
3413 "rule" => array(
3414 "Mercator" => ""
3415 ),
3416 "uri" => ""
3417 ),
3418 "metacarta" => array(
3419 "icon" => "robot",
3420 "title" => "Metacarta",
3421 "rule" => array(
3422 "^RRC \(crawler_admin@bigfoot\.com\)" => "", // parentheses escaped so they match literally, as in the samualt9 rule below
3423 "^flunky" => "",
3424 "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3425 ),
3426 "uri" => "http://www.metacarta.com"
3427 ),
3428 "metager" => array(
3429 "icon" => "metager",
3430 "title" => "MetaGer",
3431 "rule" => array(
3432 "MetaGer" => ""
3433 ),
3434 "uri" => ""
3435 ),
3436 "metamark" => array(
3437 "icon" => "robot",
3438 "title" => "Metamark",
3439 "rule" => array(
3440 "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3441 ),
3442 "uri" => "http://metamark.net"
3443 ),
3444 "metamedic" => array(
3445 "icon" => "metamedic",
3446 "title" => "MetaMedic",
3447 "rule" => array(
3448 "MediBot[ /]([0-9.]{1,10})" => "\\1"
3449 ),
3450 "uri" => ""
3451 ),
3452 "mirago" => array(
3453 "icon" => "mirago",
3454 "title" => "Mirago",
3455 "rule" => array(
3456 "Mirago" => ""
3457 ),
3458 "uri" => ""
3459 ),
3460 "misterwong" => array(
3461 "icon" => "misterwong",
3462 "title" => "Mister Wong",
3463 "rule" => array(
3464 "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3465 ),
3466 "uri" => "http://www.mister-wong.de/"
3467 ),
3468 "miva" => array(
3469 "icon" => "miva",
3470 "title" => "Miva",
3471 "rule" => array(
3472 "AlgoFeedback@miva\.com" => ""
3473 ),
3474 "uri" => "http://www.miva.com/"
3475 ),
3476 "mj12" => array(
3477 "icon" => "mj12",
3478 "title" => "Majestic-12",
3479 "rule" => array(
3480 "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3481 "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3482 ),
3483 "uri" => "http://majestic12.co.uk/bot.php"
3484 ),
3485 "mlbot" => array(
3486 "icon" => "robot",
3487 "title" => "MLBot",
3488 "rule" => array(
3489 "^MLBot" => ""
3490 ),
3491 "uri" => "http://www.metadatalabs.com/mlbot"
3492 ),
3493 "mnogo" => array(
3494 "icon" => "mnogo",
3495 "title" => "mnoGoSearch",
3496 "rule" => array(
3497 "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3498 ),
3499 "uri" => "http://www.mnogosearch.org/"
3500 ),
3501 "mobileok" => array(
3502 "icon" => "mobileok",
3503 "title" => "W3C mobileOK",
3504 "rule" => array(
3505 "^W3C-mobileOK" => ""
3506 ),
3507 "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3508 ),
3509 "mojeek" => array(
3510 "icon" => "mojeek",
3511 "title" => "Mojeek",
3512 "rule" => array(
3513 "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3514 ),
3515 "uri" => "https://www.mojeek.com/bot.html"
3516 ),
3517 "momspider" => array(
3518 "icon" => "robot",
3519 "title" => "MOM Spider",
3520 "rule" => array(
3521 "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3522 ),
3523 "uri" => ""
3524 ),
3525 "moreover" => array(
3526 "icon" => "moreover",
3527 "title" => "Moreover",
3528 "rule" => array(
3529 "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3530 ),
3531 "uri" => ""
3532 ),
3533 "movabletype" => array(
3534 "icon" => "movabletype",
3535 "title" => "Movable Type",
3536 "rule" => array(
3537 "MovableType[ /]([0-9.]{1,10})" => "\\1"
3538 ),
3539 "uri" => ""
3540 ),
3541 "mozdex" => array(
3542 "icon" => "mozdex",
3543 "title" => "MozDex",
3544 "rule" => array(
3545 "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3546 ),
3547 "uri" => ""
3548 ),
3549 "mqbot" => array(
3550 "icon" => "robot",
3551 "title" => "MQbot",
3552 "rule" => array(
3553 "MQbot" => ""
3554 ),
3555 "uri" => ""
3556 ),
3557 "msnbot" => array(
3558 "icon" => "bing",
3559 "title" => "Bing",
3560 "rule" => array(
3561 "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3562 "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3563 "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3564 "bingbot[ /]([0-9.]{1,10})" => "\\1"
3565 ),
3566 "uri" => ""
3567 ),
3568 "msnbot-mobile" => array(
3569 "icon" => "msn",
3570 "title" => "MSN Mobile",
3571 "rule" => array(
3572 "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3573 "MSNBOT_Mobile" => "",
3574 "MSMOBOT" => ""
3575 ),
3576 "uri" => ""
3577 ),
3578 "mslivebot" => array(
3579 "icon" => "livesearch",
3580 "title" => "MS Live Search",
3581 "rule" => array(
3582 "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3583 ),
3584 "uri" => ""
3585 ),
3586 "msproxy" => array(
3587 "icon" => "robot",
3588 "title" => "MSProxy",
3589 "rule" => array(
3590 "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3591 ),
3592 "uri" => ""
3593 ),
3594 "msrbot" => array(
3595 "icon" => "robot",
3596 "title" => "MSRBOT",
3597 "rule" => array(
3598 "^MSRBOT" => ""
3599 ),
3600 "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3601 ),
3602 "mswebdav" => array(
3603 "icon" => "robot",
3604 "title" => "MS-WebDAV",
3605 "rule" => array(
3606 "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3607 ),
3608 "uri" => ""
3609 ),
3610 "mticon" => array(
3611 "icon" => "robot",
3612 "title" => "MTIcon",
3613 "rule" => array(
3614 "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3615 ),
3616 "uri" => ""
3617 ),
3618 "multipage-validator" => array(
3619 "icon" => "multipage-validator",
3620 "title" => "Multipage Validator",
3621 "rule" => array(
3622 "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3623 ),
3624 "uri" => "http://www.validator.ca/"
3625 ),
3626 "myrss" => array(
3627 "icon" => "rss",
3628 "title" => "MyRSS",
3629 "rule" => array(
3630 "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3631 ),
3632 "uri" => ""
3633 ),
3634 "multimap" => array(
3635 "icon" => "robot",
3636 "title" => "Multimap",
3637 "rule" => array(
3638 "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3639 ),
3640 "uri" => ""
3641 ),
3642 "najdi" => array(
3643 "icon" => "najdi",
3644 "title" => "Najdi.si",
3645 "rule" => array(
3646 "Najdi.si" => ""
3647 ),
3648 "uri" => "http://www.najdi.si"
3649 ),
3650 "nameprotect" => array(
3651 "icon" => "nameprotect",
3652 "title" => "Name Protect",
3653 "rule" => array(
3654 "NPBot" => ""
3655 ),
3656 "uri" => ""
3657 ),
3658 "nationaldirectory" => array(
3659 "icon" => "robot",
3660 "title" => "National Directory",
3661 "rule" => array(
3662 "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3663 ),
3664 "uri" => ""
3665 ),
3666 "natsumican" => array(
3667 "icon" => "robot",
3668 "title" => "Natsu Mican",
3669 "rule" => array(
3670 "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3671 ),
3672 "uri" => ""
3673 ),
3674 "naverbot" => array(
3675 "icon" => "naverbot",
3676 "title" => "Naver",
3677 "rule" => array(
3678 "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3679 "Naver(Bot)?" => "",
3680 "^nabot" => ""
3681 ),
3682 "uri" => ""
3683 ),
3684 "navisso" => array(
3685 "icon" => "navisso",
3686 "title" => "Navisso",
3687 "rule" => array(
3688 "Navisso(Bot)?" => ""
3689 ),
3690 "uri" => "http://www.navisso.com"
3691 ),
3692 "neevabot" => array(
3693 "icon" => "neeva",
3694 "title" => "Neeva",
3695 "rule" => array(
3696 "Neevabot[ /]([0-9.]{1,10})" => "\\1"
3697 ),
3698 "uri" => "https://neeva.com/neevabot"
3699 ),
3700 "neofonie" => array(
3701 "icon" => "robot",
3702 "title" => "Neofonie",
3703 "rule" => array(
3704 "www.neofonie.de" => ""
3705 ),
3706 "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3707 ),
3708 "neomo" => array(
3709 "icon" => "robot",
3710 "title" => "Neomo",
3711 "rule" => array(
3712 "Francis[ /]([0-9.]{1,10})" => "\\1"
3713 ),
3714 "uri" => ""
3715 ),
3716 "nessus" => array(
3717 "icon" => "nessus",
3718 "title" => "Nessus",
3719 "rule" => array(
3720 "Nessus\)$" => ""
3721 ),
3722 "uri" => ""
3723 ),
3724 "nerdybot" => array(
3725 "icon" => "robot",
3726 "title" => "NerdyBot",
3727 "rule" => array(
3728 "NerdyBot" => ""
3729 ),
3730 "uri" => "http://nerdybot.com/"
3731 ),
3732 "nerdbynature" => array(
3733 "icon" => "nerdbynature",
3734 "title" => "NerdByNature",
3735 "rule" => array(
3736 "NerdByNature.Bot" => ""
3737 ),
3738 "uri" => "http://www.nerdbynature.net/bot"
3739 ),
3740 "netants" => array(
3741 "icon" => "netants",
3742 "title" => "NetAnts",
3743 "rule" => array(
3744 "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3745 ),
3746 "uri" => ""
3747 ),
3748 "netcraft" => array(
3749 "icon" => "netcraft",
3750 "title" => "Netcraft",
3751 "rule" => array(
3752 "netcraft" => ""
3753 ),
3754 "uri" => ""
3755 ),
3756 "netinfo" => array(
3757 "icon" => "netinfo",
3758 "title" => "Netinfo",
3759 "rule" => array(
3760 "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3761 ),
3762 "uri" => "http://netinfo.bg/"
3763 ),
3764 "netluchs" => array(
3765 "icon" => "netluchs",
3766 "title" => "Netluchs",
3767 "rule" => array(
3768 "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3769 ),
3770 "uri" => "http://www.netluchs.de/"
3771 ),
3772 "netmechanic" => array(
3773 "icon" => "netmechanic",
3774 "title" => "NetMechanic",
3775 "rule" => array(
3776 "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3777 ),
3778 "uri" => ""
3779 ),
3780 "netnose" => array(
3781 "icon" => "netnose",
3782 "title" => "NetNose",
3783 "rule" => array(
3784 "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3785 ),
3786 "uri" => ""
3787 ),
3788 "netoskop" => array(
3789 "icon" => "robot",
3790 "title" => "Netoskop",
3791 "rule" => array(
3792 "netoskop" => ""
3793 ),
3794 "uri" => ""
3795 ),
3796 "netpromoter" => array(
3797 "icon" => "netpromoter",
3798 "title" => "NetPromoter",
3799 "rule" => array(
3800 "NetPromoter Spider" => ""
3801 ),
3802 "uri" => "http://www.net-promoter.com/"
3803 ),
3804 "netprospector" => array(
3805 "icon" => "robot",
3806 "title" => "Netprospector",
3807 "rule" => array(
3808 "^netprospector" => ""
3809 )
3810 ),
3811 "netpumper" => array(
3812 "icon" => "robot",
3813 "title" => "Netpumper",
3814 "rule" => array(
3815 "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3816 ),
3817 "uri" => ""
3818 ),
3819 "netscapeproxy" => array(
3820 "icon" => "netscape",
3821 "title" => "Netscape Proxy",
3822 "rule" => array(
3823 "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3824 ),
3825 "uri" => ""
3826 ),
3827 "netspective" => array(
3828 "icon" => "robot",
3829 "title" => "NetSpective",
3830 "rule" => array(
3831 "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3832 ),
3833 "uri" => ""
3834 ),
3835 "netvibes" => array(
3836 "icon" => "netvibes",
3837 "title" => "Netvibes",
3838 "rule" => array(
3839 "^Netvibes" => "" // pattern has no capture group, so there is no version to reference
3840 ),
3841 "uri" => ""
3842 ),
3843 "newsfire" => array(
3844 "icon" => "newsfire",
3845 "title" => "NewsFire",
3846 "rule" => array(
3847 "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3848 ),
3849 "uri" => ""
3850 ),
3851 "newsgator" => array(
3852 "icon" => "newsgator",
3853 "title" => "NewsGator",
3854 "rule" => array(
3855 "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3856 ),
3857 "uri" => ""
3858 ),
3859 "newzcrawler" => array(
3860 "icon" => "newzcrawler",
3861 "title" => "NewzCrawler",
3862 "rule" => array(
3863 "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3864 ),
3865 "uri" => ""
3866 ),
3867 "nextopia" => array(
3868 "icon" => "robot", // generic icon; NOTE(review): switch to a dedicated "nextopia" icon if one ships with the icon set
3869 "title" => "Nextopia", // was "NewzCrawler", duplicated from the preceding entry
3870 "rule" => array(
3871 "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
3872 ),
3873 "uri" => ""
3874 ),
3875 "ngsearch" => array(
3876 "icon" => "ngsearch",
3877 "title" => "NG Search",
3878 "rule" => array(
3879 "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3880 ),
3881 "uri" => ""
3882 ),
3883 "nimble" => array(
3884 "icon" => "robot",
3885 "title" => "Nimble",
3886 "rule" => array(
3887 "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3888 ),
3889 "uri" => ""
3890 ),
3891 "nmap" => array(
3892 "icon" => "nmap",
3893 "title" => "Nmap",
3894 "rule" => array(
3895 "Nmap Scripting Engine" => ""
3896 ),
3897 "uri" => "http://nmap.org/book/nse.html"
3898 ),
3899 "nusearch" => array(
3900 "icon" => "robot",
3901 "title" => "NuSearch",
3902 "rule" => array(
3903 "^nuSearch" => ""
3904 ),
3905 "uri" => "http://www.nusearch.com/"
3906 ),
3907 "noago" => array(
3908 "icon" => "noago",
3909 "title" => "Noago",
3910 "rule" => array(
3911 "Noago Spider" => ""
3912 ),
3913 "uri" => "http://www.noago.com/"
3914 ),
3915 "noviforum" => array(
3916 "icon" => "noviforum",
3917 "title" => "Noviforum",
3918 "rule" => array(
3919 "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3920 ),
3921 "uri" => ""
3922 ),
3923 "noxtrum" => array(
3924 "icon" => "noxtrum",
3925 "title" => "noXtrum",
3926 "rule" => array(
3927 "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3928 ),
3929 "uri" => ""
3930 ),
3931 "noyona" => array(
3932 "icon" => "robot",
3933 "title" => "Noyona",
3934 "rule" => array(
3935 "noyona.([0-9._]{1,10})" => "\\1"
3936 ),
3937 "uri" => "http://noyona.com/"
3938 ),
3939 "nsauditor" => array(
3940 "icon" => "nsauditor",
3941 "title" => "Nsauditor",
3942 "rule" => array(
3943 "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3944 ),
3945 "uri" => "http://www.nsauditor.com/"
3946 ),
3947 "obidosbot" => array(
3948 "icon" => "robot",
3949 "title" => "Bookwatch",
3950 "rule" => array(
3951 "obidos[ \-]?bot" => ""
3952 ),
3953 "uri" => ""
3954 ),
3955 "objectssearch" => array(
3956 "icon" => "robot",
3957 "title" => "Objects Search",
3958 "rule" => array(
3959 "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3960 ),
3961 "uri" => ""
3962 ),
3963 "obot" => array(
3964 "icon" => "ibm",
3965 "title" => "IBM (ONLY) Crawler",
3966 "rule" => array(
3967 "oBot[ /]([0-9.]{1,10})" => "\\1"
3968 ),
3969 "uri" => "http://filterdb.iss.net/crawler/"
3970 // Previously from "ONLY Solutions GmbH" – that is what the O stands for
3971 ),
3972 "ocawa" => array(
3973 "icon" => "ocawa",
3974 "title" => "Ocawa",
3975 "rule" => array(
3976 "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3977 "Ocawa" => ""
3978 ),
3979 "uri" => "http://www.ocawa.com/"
3980 ),
3981 "octora" => array(
3982 "icon" => "octora",
3983 "title" => "Octora",
3984 "rule" => array(
3985 "^Octora (Beta)?" => ""
3986 ),
3987 "uri" => "http://www.octora.com/"
3988 ),
3989 "offlineexplorer" => array(
3990 "icon" => "robot",
3991 "title" => "OfflineExplorer",
3992 "rule" => array(
3993 "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3994 ),
3995 "uri" => ""
3996 ),
3997 "okhttp" => array(
3998 "icon" => "okhttp",
3999 "title" => "OkHttp",
4000 "rule" => array(
4001 "okhttp[ /]([0-9.]{1,10})" => "\\1",
4002 "okhttp" => ""
4003 ),
4004 "uri" => "https://square.github.io/okhttp/"
4005 ),
4006 "omea" => array(
4007 "icon" => "omea",
4008 "title" => "Omea Reader",
4009 "rule" => array(
4010 "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
4011 ),
4012 "uri" => ""
4013 ),
4014 "onet" => array(
4015 "icon" => "onet",
4016 "title" => "Onet",
4017 "rule" => array(
4018 "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
4019 "Onet\.pl" => "",
4020 "inktomi.search.onet" => ""
4021 ),
4022 "uri" => "http://www.onet.pl"
4023 ),
4024 "online24" => array(
4025 "icon" => "robot",
4026 "title" => "Online24",
4027 "rule" => array(
4028 "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
4029 ),
4030 "uri" => "http://www.online24.de"
4031 ),
4032 "onlinewebcheck" => array(
4033 "icon" => "csehtmlvalidator",
4034 "title" => "CSE HTML Validator",
4035 "rule" => array(
4036 "onlinewebcheck" => ""
4037 ),
4038 "uri" => "http://www.onlinewebcheck.com"
4039 ),
4040 "onsearch" => array(
4041 "icon" => "onsearch",
4042 "title" => "OnSearch",
4043 "rule" => array(
4044 "^onCHECK-Robot" => ""
4045 ),
4046 "uri" => "http://www.onsearch.de"
4047 ),
4048 "onto" => array(
4049 "icon" => "robot",
4050 "title" => "OntoSpider",
4051 "rule" => array(
4052 "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
4053 ),
4054 "uri" => "http://ontospider.i-n.info/"
4055 ),
4056 "openacoon" => array(
4057 "icon" => "robot",
4058 "title" => "OpenAcoon",
4059 "rule" => array(
4060 "^OpenAcoon v([0-9.]{1,10})" => "\\1"
4061 ),
4062 "uri" => "http://www.openacoon.de/"
4063 ),
4064 "openfind" => array(
4065 "icon" => "openfind",
4066 "title" => "Openfind",
4067 "rule" => array(
4068 "openbot[ /]([0-9.]{1,10})" => "\\1",
4069 "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4070 ),
4071 "uri" => ""
4072 ),
4073 "opentagger" => array(
4074 "icon" => "robot",
4075 "title" => "OpenTagger",
4076 "rule" => array(
4077 "^OpenTaggerBot" => ""
4078 ),
4079 "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4080 ),
4081 "opentext" => array(
4082 "icon" => "opentext",
4083 "title" => "OpenText",
4084 "rule" => array(
4085 "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4086 ),
4087 "uri" => "http://www.opentext.net/"
4088 ),
4089 "openweb" => array(
4090 "icon" => "robot",
4091 "title" => "OpenWebSpider",
4092 "rule" => array(
4093 "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4094 "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4095 ),
4096 "uri" => "http://www.openwebspider.org"
4097 ),
4098 "openx" => array(
4099 "icon" => "openx",
4100 "title" => "OpenX Spider",
4101 "rule" => array(
4102 "OpenX" => ""
4103 ),
4104 "uri" => "http://www.openx.org"
4105 ),
4106 "orange" => array(
4107 "icon" => "orange",
4108 "title" => "Orange",
4109 "rule" => array(
4110 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4111 "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4112 ),
4113 "uri" => "http://orange.com/"
4114 ),
4115 "organica" => array(
4116 "icon" => "robot",
4117 "title" => "Organica",
4118 "rule" => array(
4119 "crawler@organica\.us" => ""
4120 ),
4121 "uri" => ""
4122 ),
4123 "outfox" => array(
4124 "icon" => "robot",
4125 "title" => "Outfox Melon",
4126 "rule" => array(
4127 "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4128 "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4129 ),
4130 "uri" => ""
4131 ),
4132 "overture" => array(
4133 "icon" => "overture",
4134 "title" => "Overture",
4135 "rule" => array(
4136 "Overture[ \-]?WebCrawler" => ""
4137 ),
4138 "uri" => ""
4139 ),
4140 "owler" => array(
4141 "icon" => "robot",
4142 "title" => "Owler",
4143 "rule" => array(
4144 "Owler[ /]([0-9.]{1,10})" => "\\1",
4145 "Owler" => ""
4146 ),
4147 "uri" => ""
4148 ),
4149 "page2rss" => array(
4150 "icon" => "page2rss",
4151 "title" => "Page2RSS",
4152 "rule" => array(
4153 "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4154 ),
4155 "uri" => "http://page2rss.com"
4156 ),
4157 "pagebytes" => array(
4158 "icon" => "robot",
4159 "title" => "PageBites",
4160 "rule" => array(
4161 "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4162 ),
4163 "uri" => ""
4164 ),
4165 "pagesinventory" => array(
4166 "icon" => "pagesinventory",
4167 "title" => "PagesInventory",
4168 "rule" => array(
4169 "^PagesInventory" => ""
4170 ),
4171 "uri" => "http://www.pagesinventory.com"
4172 ),
4173 "pagesjaunes" => array(
4174 "icon" => "pagesjaunes",
4175 "title" => "Pages Jaunes",
4176 "rule" => array(
4177 "PJBot[ /]([0-9.]{1,10})" => "\\1"
4178 ),
4179 "uri" => "http://www.pagesjaunes.fr/"
4180 ),
4181 "pagevalet" => array(
4182 "icon" => "wdg",
4183 "title" => "WDG Page Valet",
4184 "rule" => array(
4185 "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4186 ),
4187 "uri" => "http://www.htmlhelp.com/tools/validator/"
4188 ),
4189 "panopeabot" => array(
4190 "icon" => "robot",
4191 "title" => "PanopeaBot",
4192 "rule" => array(
4193 "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4194 ),
4195 "uri" => ""
4196 ),
4197 "parchmenthill" => array(
4198 "icon" => "robot",
4199 "title" => "Parchment Hill",
4200 "rule" => array(
4201 "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4202 ),
4203 "uri" => "http://www.parchmenthill.com/search.htm"
4204 ),
4205 "pascient" => array( // Panscient crawler; key and icon keep the old "pascient" spelling (NOTE(review): presumably referenced elsewhere - confirm before renaming)
4206 "icon" => "pascient",
4207 "title" => "Panscient", // was "Pascient"; now spelled like the rule and uri below
4208 "rule" => array(
4209 "panscient.com" => "" // no capture group, so no version note
4210 ),
4211 "uri" => "http://www.panscient.com/"
4212 ),
4213 "peerbot" => array(
4214 "icon" => "peerbot",
4215 "title" => "Peerbot",
4216 "rule" => array(
4217 "^PEERbot" => ""
4218 ),
4219 "uri" => ""
4220 ),
4221 "petalbot" => array(
4222 "icon" => "huawei",
4223 "title" => "PetalBot", // Huawei Search - also called Aspiegel
4224 "rule" => array(
4225 "PetalBot" => "",
4226 "AspiegelBot" => ""
4227 ),
4228 "uri" => "https://aspiegel.com/petalbot"
4229 ),
4230 "php" => array(
4231 "icon" => "php",
4232 "title" => "PHP",
4233 "rule" => array(
4234 "^PHP[ /]([0-9.]{1,10})" => "\\1"
4235 ),
4236 "uri" => ""
4237 ),
4238 "phpcrawl" => array(
4239 "icon" => "robot",
4240 "title" => "PHPCrawl",
4241 "rule" => array(
4242 "^PHPCrawl" => ""
4243 ),
4244 "uri" => "http://phpcrawl.cuab.de/"
4245 ),
4246 "phpdig" => array(
4247 "icon" => "robot",
4248 "title" => "PhpDig",
4249 "rule" => array(
4250 "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4251 ),
4252 "uri" => "http://www.finbot.com/"
4253 ),
4254 "phpversiontracker" => array(
4255 "icon" => "phpversiontracker",
4256 "title" => "PHP version tracker",
4257 "rule" => array(
4258 "^PHP version tracker" => ""
4259 ),
4260 "uri" => "http://www.nexen.net/phpversion/bot.php"
4261 ),
4262 "pictureofinternet" => array( // PictureOfInternet user agents
4263 "icon" => "robot",
4264 "title" => "PictureOfInternet",
4265 "rule" => array(
4266 "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // was "": the captured version (group 1) was being thrown away
4267 ),
4268 "uri" => ""
4269 ),
4270 "pingdom" => array(
4271 "icon" => "pingdom",
4272 "title" => "Pingdom",
4273 "rule" => array(
4274 "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4275 "^Pingdom" => ""
4276 ),
4277 "uri" => "http://www.pingdom.com/"
4278 ),
4279 "pinseri" => array(
4280 "icon" => "pinseri",
4281 "title" => "Pinseri",
4282 "rule" => array(
4283 "www\.pinseri\.com/bloglist" => ""
4284 ),
4285 "uri" => ""
4286 ),
4287 "plagger" => array( // Plagger feed aggregator user agents
4288 "icon" => "plagger",
4289 "title" => "Plagger",
4290 "rule" => array(
4291 "Plagger[ /]([0-9.]{1,10})" => "\\1" // group 1 = version
4292 ),
4293 "uri" => "http://plagger.org/" // was "http://www.plugger.org" (NOTE(review): assumed typo for the Plagger project site - confirm)
4294 ),
4295 "planet" => array(
4296 "icon" => "planet",
4297 "title" => "Planet",
4298 "rule" => array(
4299 "Planet[ /]([0-9.]{1,10})" => "\\1"
4300 ),
4301 "uri" => ""
4302 ),
4303 "plantynet" => array(
4304 "icon" => "robot",
4305 "title" => "PlantyNet",
4306 "rule" => array(
4307 "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4308 ),
4309 "uri" => ""
4310 ),
4311 "pluck" => array(
4312 "icon" => "pluck",
4313 "title" => "Pluck",
4314 "rule" => array(
4315 "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4316 ),
4317 "uri" => ""
4318 ),
4319 "plsearch" => array(
4320 "icon" => "plsearch",
4321 "title" => "PlanetSearch",
4322 "rule" => array(
4323 "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4324 ),
4325 "uri" => ""
4326 ),
4327 "poe" => array(
4328 "icon" => "robot",
4329 "title" => "POE-Component",
4330 "rule" => array(
4331 "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4332 ),
4333 "uri" => ""
4334 ),
4335 "pogodak" => array(
4336 "icon" => "pogodak",
4337 "title" => "Pogodak",
4338 "rule" => array(
4339 "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4340 ),
4341 "uri" => ""
4342 ),
4343 "poodle" => array( // Poodle predictor user agents ("Poodle" or "Pooodle" spelling)
4344 "icon" => "robot",
4345 "title" => "Poodle predictor",
4346 "rule" => array(
4347 "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // was "\\1", which is the (oo|ooo) alternation; the version is group 2
4348 "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no version follows
4349 ),
4350 "uri" => "http://www.gritechnologies.com/tools/spider.go"
4351 ),
4352 "pompos" => array(
4353 "icon" => "pompos",
4354 "title" => "Pompos",
4355 "rule" => array(
4356 "Pompos[ /]([0-9.]{1,10})" => "\\1"
4357 ),
4358 "uri" => ""
4359 ),
4360 "popdex" => array(
4361 "icon" => "robot",
4362 "title" => "Popdexter",
4363 "rule" => array(
4364 "Popdexter" => ""
4365 ),
4366 "uri" => ""
4367 ),
4368 "postrank" => array(
4369 "icon" => "postrank",
4370 "title" => "PostRank",
4371 "rule" => array(
4372 "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4373 ),
4374 "uri" => "http://www.postrank.com/"
4375 ),
4376 "powermarks" => array(
4377 "icon" => "robot",
4378 "title" => "Powermarks",
4379 "rule" => array(
4380 "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4381 ),
4382 "uri" => ""
4383 ),
4384 "pinterest" => array( // Pinterest user agents
4385 "icon" => "pinterest",
4386 "title" => "Pinterest", // was "PROBE!", duplicated from the neighbouring "probe" entry
4387 "rule" => array(
4388 "Pinterest[ /]([0-9.]{1,10})" => "\\1" // group 1 = version
4389 ),
4390 "uri" => "http://www.pinterest.com/"
4391 ),
4392 "probe" => array(
4393 "icon" => "robot",
4394 "title" => "PROBE!",
4395 "rule" => array(
4396 "^PROBE!" => ""
4397 ),
4398 "uri" => ""
4399 ),
4400 "projecthoneypot" => array(
4401 "icon" => "projecthoneypot",
4402 "title" => "Project Honeypot",
4403 "rule" => array(
4404 "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4405 "projecthoneypot" => ""
4406 ),
4407 "uri" => "http://www.projecthoneypot.org"
4408 ),
4409 "proxycache" => array(
4410 "icon" => "robot",
4411 "title" => "Proxy Cache",
4412 "rule" => array(
4413 "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4414 ),
4415 "uri" => ""
4416 ),
4417 "proxyhunter" => array(
4418 "icon" => "robot",
4419 "title" => "ProxyHunter",
4420 "rule" => array(
4421 "ProxyHunter" => ""
4422 ),
4423 "uri" => ""
4424 ),
4425 "psbot" => array(
4426 "icon" => "picsearch",
4427 "title" => "PicSearch",
4428 "rule" => array(
4429 "^psbot" => ""
4430 ),
4431 "uri" => ""
4432 ),
4433 "pubsub" => array(
4434 "icon" => "pubsub",
4435 "title" => "PubSub",
4436 "rule" => array(
4437 "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4438 "^PubSub\.com" => ""
4439 ),
4440 "uri" => ""
4441 ),
4442 "pubarch" => array(
4443 "icon" => "robot",
4444 "title" => "PubArchive",
4445 "rule" => array(
4446 "publiclibraryarchive.org" => ""
4447 ),
4448 "uri" => ""
4449 ),
4450 "pukiwiki" => array(
4451 "icon" => "pukiwiki",
4452 "title" => "PukiWiki",
4453 "rule" => array(
4454 "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4455 ),
4456 "uri" => ""
4457 ),
4458 "pwebotxy" => array(
4459 "icon" => "pwebotxy",
4460 "title" => "PWeBot/X.Y",
4461 "rule" => array(
4462 "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4463 ),
4464 "uri" => "http://www.programacionweb.net/robot.php"
4465 ),
4466 "pxys" => array(
4467 "icon" => "robot",
4468 "title" => "PXYS",
4469 "rule" => array(
4470 "^pxys" => ""
4471 ),
4472 "uri" => ""
4473 ),
4474 "qango" => array( // Qango.com user agents
4475 "icon" => "qango",
4476 "title" => "Qango",
4477 "rule" => array(
4478 "^Qango.com" => "" // no capture group, so no version note
4479 ),
4480 "uri" => "http://www.qango.com/" // was "quango.com", which disagrees with the rule above (NOTE(review): confirm the domain)
4481 ),
4482 "qihoo" => array(
4483 "icon" => "qihoo",
4484 "title" => "Qihoo",
4485 "rule" => array(
4486 "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4487 ),
4488 "uri" => "http://www.qihoo.com/"
4489 ),
4490 "qseero" => array(
4491 "icon" => "robot",
4492 "title" => "Qseero",
4493 "rule" => array(
4494 "Qseero v([0-9.]{1,10})" => "\\1"
4495 ),
4496 "uri" => "http://www.q0.com/"
4497 ),
4498 "quantcast" => array(
4499 "icon" => "robot",
4500 "title" => "Quantcast",
4501 "rule" => array(
4502 "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4503 ),
4504 "uri" => "http://www.quantcast.com/"
4505 ),
4506 "quepasa" => array(
4507 "icon" => "quepasa",
4508 "title" => "Quepasa",
4509 "rule" => array(
4510 "Quepasa[ \-]?Creep" => ""
4511 ),
4512 "uri" => ""
4513 ),
4514 "questfinder" => array(
4515 "icon" => "robot",
4516 "title" => "QuestFinder",
4517 "rule" => array(
4518 "www\.questfinder\.com" => ""
4519 ),
4520 "uri" => ""
4521 ),
4522 "qwantify" => array(
4523 "icon" => "qwantify",
4524 "title" => "Qwantify",
4525 "rule" => array(
4526 "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4527 ),
4528 "uri" => "https://www.qwant.com/"
4529 ),
4530 "qweery" => array(
4531 "icon" => "robot",
4532 "title" => "Qweery",
4533 "rule" => array(
4534 "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4535 ),
4536 "uri" => "http://qweerybot.qweery.nl"
4537 ),
4538 "racaicrawler" => array( // RacaiCrawler user agents
4539 "icon" => "robot",
4540 "title" => "RacaiCrawler",
4541 "rule" => array(
4542 "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1" // group 1 = version after a space or hyphen
4543 ), "uri" => "" // added: every other entry visible here defines "uri"; empty string as in entries without a homepage
4544 ),
4545 "radian6" => array(
4546 "icon" => "robot",
4547 "title" => "Radian6",
4548 "rule" => array(
4549 "www\.radian6\.com" => ""
4550 ),
4551 "uri" => "http://www.radian6.com"
4552 ),
4553 "radiofx" => array( // Radio.fx user agents
4554 "icon" => "radiofx",
4555 "title" => "Radio.fx",
4556 "rule" => array(
4557 "Radio.fx" => "" // no capture group, so no version note
4558 ),
4559 "uri" => "https://de.tobit.software" // was "...tobit.softwarw" (typo in the top-level domain)
4560 ),
4561 "rambler" => array(
4562 "icon" => "rambler",
4563 "title" => "Rambler",
4564 "rule" => array(
4565 "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4566 ),
4567 "uri" => ""
4568 ),
4569 "ramiba" => array( // Ramiba user agents ("ramiba" or "ramiba-bot")
4570 "icon" => "robot",
4571 "title" => "Ramiba",
4572 "rule" => array(
4573 "^ramiba(-bot)?" => "" // was "\\1": group 1 is only the optional literal "-bot" suffix, not a version
4574 ),
4575 "uri" => ""
4576 ),
4577 "rankur" => array(
4578 "icon" => "rankur",
4579 "title" => "Rankur",
4580 "rule" => array(
4581 "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4582 ),
4583 "uri" => "http://rankur.com/",
4584 ),
4585 "red" => array(
4586 "icon" => "red",
4587 "title" => "RED",
4588 "rule" => array(
4589 "RED[ /]([0-9.]{1,10})" => "\\1"
4590 ),
4591 "uri" => "http://redbot.org/"
4592 ),
4593 "rediff" => array(
4594 "icon" => "rediff",
4595 "title" => "Rediff",
4596 "rule" => array(
4597 "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4598 ),
4599 "uri" => "http://www.rediff.com",
4600 ),
4601 "repia" => array(
4602 "icon" => "robot",
4603 "title" => "Repia",
4604 "rule" => array(
4605 "webmaster@repia\.com" => ""
4606 ),
4607 "uri" => ""
4608 ),
4609 "robotgenius" => array(
4610 "icon" => "robot",
4611 "title" => "Robot Genius",
4612 "rule" => array(
4613 "^robotgenius" => ""
4614 ),
4615 "uri" => "http://robotgenius.net",
4616 ),
4617 "robozilla" => array(
4618 "icon" => "robot",
4619 "title" => "Robozilla",
4620 "rule" => array(
4621 "Robozilla" => ""
4622 ),
4623 "uri" => ""
4624 ),
4625 "rogerbot" => array(
4626 "icon" => "moz",
4627 "title" => "Moz Rogerbot",
4628 "rule" => array(
4629 "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4630 ),
4631 "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4632 ),
4633 "rojo" => array(
4634 "icon" => "rojo",
4635 "title" => "Rojo",
4636 "rule" => array(
4637 "Rojo[ /]([0-9.]{1,10})" => "\\1"
4638 ),
4639 "uri" => ""
4640 ),
4641 "rss-atom" => array(
4642 "icon" => "rss",
4643 "title" => "RSS / Atom",
4644 "rule" => array(
4645 "^Apple-PubSub" => "",
4646 "^AppleSyndication" => ""
4647 ),
4648 "uri" => ""
4649 ),
4650 "rssbot" => array(
4651 "icon" => "rss",
4652 "title" => "RSS-bot",
4653 "rule" => array(
4654 "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4655 ),
4656 "uri" => ""
4657 ),
4658 "rssbandit" => array(
4659 "icon" => "rssbandit",
4660 "title" => "RssBandit",
4661 "rule" => array(
4662 "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4663 ),
4664 "uri" => ""
4665 ),
4666 "rssimages" => array(
4667 "icon" => "rss",
4668 "title" => "RssImages",
4669 "rule" => array(
4670 "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4671 ),
4672 "uri" => ""
4673 ),
4674 "rssmicro" => array(
4675 "icon" => "rssmicro",
4676 "title" => "RSSMicro",
4677 "rule" => array(
4678 "RSSMicro\.com" => ""
4679 ),
4680 "uri" => "http://www.rssmicro.com"
4681 ),
4682 "rssowl" => array(
4683 "icon" => "rssowl",
4684 "title" => "RSSOwl",
4685 "rule" => array(
4686 "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4687 ),
4688 "uri" => ""
4689 ),
4690 "rssreader" => array( // RssReader user agents
4691 "icon" => "rss",
4692 "title" => "RssReader",
4693 "rule" => array(
4694 "RssReader[ /]([0-9.]{1,10})" => "\\1" // was "": the captured version (group 1) was being thrown away
4695 ),
4696 "uri" => ""
4697 ),
4698 "rtgi" => array(
4699 "icon" => "rtgi",
4700 "title" => "Rtgi",
4701 "rule" => array(
4702 "RTGI" => ""
4703 ),
4704 "uri" => "http://rtgi.fr/"
4705 ),
4706 "rufusbot" => array(
4707 "icon" => "robot",
4708 "title" => "RufusBot",
4709 "rule" => array(
4710 "RufusBot" => ""
4711 ),
4712 "uri" => ""
4713 ),
4714 "runet" => array(
4715 "icon" => "runet",
4716 "title" => "iTrack RuNet Crawler",
4717 "rule" => array(
4718 "Runet-Research-Crawler" => ""
4719 ),
4720 "uri" => "http://www.itrack.ru/research/cmsrate/"
4721 ),
4722 "runnk" => array(
4723 "icon" => "robot",
4724 "title" => "Runnk",
4725 "rule" => array(
4726 "Runnk RSS finder" => ""
4727 ),
4728 "uri" => "http://www.runnk.com/il/law"
4729 ),
4730 "sagool" => array(
4731 "icon" => "robot",
4732 "title" => "Sagool",
4733 "rule" => array(
4734 "MaSagool" => ""
4735 ),
4736 "uri" => "http://sagool.jp/"
4737 ),
4738 "sanszbot" => array(
4739 "icon" => "robot",
4740 "title" => "Sansz",
4741 "rule" => array(
4742 "SanszBot" => ""
4743 ),
4744 "uri" => ""
4745 ),
4746 "saucereader" => array(
4747 "icon" => "saucereader",
4748 "title" => "Sauce Reader",
4749 "rule" => array(
4750 "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4751 ),
4752 "uri" => ""
4753 ),
4754 "sbider" => array(
4755 "icon" => "sbider",
4756 "title" => "SBIder",
4757 "rule" => array(
4758 "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4759 "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4760 ),
4761 "uri" => ""
4762 ),
4763 "scirus" => array(
4764 "icon" => "robot",
4765 "title" => "Scirus",
4766 "rule" => array(
4767 "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4768 ),
4769 "uri" => ""
4770 ),
4771 "scoutjet" => array(
4772 "icon" => "scoutjet",
4773 "title" => "ScoutJet",
4774 "rule" => array(
4775 "ScoutJet" => ""
4776 ),
4777 "uri" => "http://www.scoutjet.com/"
4778 ),
4779 "scrapy" => array(
4780 "icon" => "scrapy",
4781 "title" => "Scrapy",
4782 "rule" => array(
4783 "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4784 ),
4785 "uri" => "http://scrapy.org"
4786 ),
4787 "scrubby" => array(
4788 "icon" => "scrubby",
4789 "title" => "Scrubby",
4790 "rule" => array(
4791 "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4792 ),
4793 "uri" => ""
4794 ),
4795 "sdm" => array(
4796 "icon" => "sdm",
4797 "title" => "SUN Download Manager",
4798 "rule" => array(
4799 "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4800 ),
4801 "uri" => ""
4802 ),
4803 "sealinks" => array(
4804 "icon" => "robot",
4805 "title" => "Sea Links",
4806 "rule" => array(
4807 "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4808 ),
4809 "uri" => ""
4810 ),
4811 "search17" => array(
4812 "icon" => "robot",
4813 "title" => "Search 17",
4814 "rule" => array(
4815 "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4816 ),
4817 "uri" => "http://www.search17.com/bot.php"
4818 ),
4819 "search2" => array(
4820 "icon" => "search2",
4821 "title" => "Search2.net",
4822 "rule" => array(
4823 "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4824 ),
4825 "uri" => "http://search2.net/"
4826 ),
4827 "searchbot" => array(
4828 "icon" => "robot",
4829 "title" => "Searchbot",
4830 "rule" => array(
4831 "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4832 ),
4833 "uri" => ""
4834 ),
4835 "searchch" => array(
4836 "icon" => "robot",
4837 "title" => "Search.ch",
4838 "rule" => array(
4839 "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4840 ),
4841 "uri" => ""
4842 ),
4843 "searchengineworld" => array(
4844 "icon" => "robot",
4845 "title" => "SearchEngineWorld",
4846 "rule" => array(
4847 "searchengineworld" => ""
4848 ),
4849 "uri" => "http://www.searchengineworld.com/"
4850 ),
4851 "searchhippo" => array(
4852 "icon" => "searchhippo",
4853 "title" => "Searchhippo",
4854 "rule" => array(
4855 "searchhippo" => ""
4856 ),
4857 "uri" => "http://www.searchhippo.com/"
4858 ),
4859 "searchthruus" => array(
4860 "icon" => "robot",
4861 "title" => "SearchThruUs",
4862 "rule" => array(
4863 "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4864 ),
4865 "uri" => ""
4866 ),
4867 "securecomputing" => array(
4868 "icon" => "robot",
4869 "title" => "Secure Computing",
4870 "rule" => array(
4871 "securecomputing" => ""
4872 ),
4873 "uri" => ""
4874 ),
4875 "seekport" => array(
4876 "icon" => "seekport",
4877 "title" => "Seekport",
4878 "rule" => array(
4879 "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4880 ),
4881 "uri" => ""
4882 ),
4883 "semanticdiscovery" => array(
4884 "icon" => "robot",
4885 "title" => "Semantic Discovery",
4886 "rule" => array(
4887 "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4888 ),
4889 "uri" => ""
4890 ),
4891 "semrush" => array(
4892 "icon" => "semrush",
4893 "title" => "SEMrush",
4894 "rule" => array(
4895 "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4896 ),
4897 "uri" => "http://www.semrush.com/bot.html"
4898 ),
4899 "sengine" => array(
4900 "icon" => "sengine",
4901 "title" => "Sengine",
4902 "rule" => array(
4903 "netEstate NE Crawler" => ""
4904 ),
4905 "uri" => "http://www.sengine.info/"
4906 ),
4907 "sensis" => array(
4908 "icon" => "sensis",
4909 "title" => "Sensis",
4910 "rule" => array(
4911 "^Sensis(.com.au)? Web Crawler" => ""
4912 ),
4913 "uri" => "http://sensis.com.au"
4914 ),
4915 "seokicks" => array(
4916 "icon" => "seokicks",
4917 "title" => "SEOkicks",
4918 "rule" => array(
4919 "SEOkicks-Robot" => ""
4920 ),
4921 "uri" => "http://www.seokicks.de/"
4922 ),
4923 "seoprofiler" => array(
4924 "icon" => "seoprofiler",
4925 "title" => "SEOprofiler",
4926 "rule" => array(
4927 "spbot[ /]([0-9.]{1,10})" => "\\1"
4928 ),
4929 "uri" => "http://www.seoprofiler.com/"
4930 ),
4931 "setooz" => array(
4932 "icon" => "setooz",
4933 "title" => "Setooz",
4934 "rule" => array(
4935 "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4936 ),
4937 "uri" => "http://www.setooz.com/oozbot.html"
4938 ),
4939 "seznam" => array(
4940 "icon" => "seznam",
4941 "title" => "Seznam",
4942 "rule" => array(
4943 "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4944 "Seznam" => ""
4945 ),
4946 "uri" => "http://www.seznam.cz"
4947 ),
4948 "sharpreader" => array(
4949 "icon" => "sharpreader",
4950 "title" => "SharpReader",
4951 "rule" => array(
4952 "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4953 ),
4954 "uri" => ""
4955 ),
4956 "shelob" => array( // Shelob user agents
4957 "icon" => "shelob",
4958 "title" => "Shelob", // was "Sherlock Spider", the title of the separate "sherlockspider" entry
4959 "rule" => array(
4960 "^Shelob" => "" // no capture group, so no version note
4961 ),
4962 "uri" => "http://www.gmx.net"
4963 ),
4964 "sherlockspider" => array(
4965 "icon" => "robot",
4966 "title" => "Sherlock Spider",
4967 "rule" => array(
4968 "sherlock_spider" => ""
4969 ),
4970 "uri" => ""
4971 ),
4972 "shim" => array(
4973 "icon" => "robot",
4974 "title" => "Shim Crawler",
4975 "rule" => array(
4976 "shim[ \-]crawler" => ""
4977 ),
4978 "uri" => ""
4979 ),
4980 "shopwiki" => array(
4981 "icon" => "shopwiki",
4982 "title" => "ShopWiki",
4983 "rule" => array(
4984 "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4985 ),
4986 "uri" => ""
4987 ),
4988 "shoula" => array(
4989 "icon" => "robot",
4990 "title" => "Shoula",
4991 "rule" => array(
4992 "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4993 ),
4994 "uri" => "http://www.shoula.com"
4995 ),
4996 "siege" => array(
4997 "icon" => "robot",
4998 "title" => "Siege",
4999 "rule" => array(
5000 "Siege[ /]([0-9.]{1,10})" => "\\1"
5001 ),
5002 "uri" => ""
5003 ),
5004 "siets" => array(
5005 "icon" => "robot",
5006 "title" => "Siets",
5007 "rule" => array(
5008 "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
5009 ),
5010 "uri" => ""
5011 ),
5012 "simpy" => array(
5013 "icon" => "simpy",
5014 "title" => "Simpy",
5015 "rule" => array(
5016 "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
5017 ),
5018 "uri" => ""
5019 ),
5020 "singingfish" => array(
5021 "icon" => "singingfish",
5022 "title" => "SingingFish",
5023 "rule" => array(
5024 "asterias[ /]([0-9.]{1,10})" => "\\1",
5025 "Asterias Crawler v([0-9.]{1,10})" => "\\1",
5026 "asterias" => ""
5027 ),
5028 "uri" => ""
5029 ),
5030 "sirketce" => array(
5031 "icon" => "robot",
5032 "title" => "Sirketce",
5033 "rule" => array(
5034 "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
5035 ),
5036 "uri" => "http://www.sirketce.com/bot.html"
5037 ),
5038 "sirobot" => array(
5039 "icon" => "robot",
5040 "title" => "SiroBot",
5041 "rule" => array(
5042 "sirobot" => ""
5043 ),
5044 "uri" => ""
5045 ),
5046 "sistrix" => array(
5047 "icon" => "sistrix",
5048 "title" => "SISTRIX",
5049 "rule" => array(
5050 "SISTRIX Crawler" => ""
5051 ),
5052 "uri" => "http://crawler.sistrix.net/"
5053 ),
5054 "sitebar" => array(
5055 "icon" => "sitebar",
5056 "title" => "SiteBar",
5057 "rule" => array(
5058 "SiteBar[ /]([0-9.]{1,10})" => "\\1"
5059 ),
5060 "uri" => ""
5061 ),
5062 "sitebot" => array(
5063 "icon" => "sitebot",
5064 "title" => "SiteBot",
5065 "rule" => array(
5066 "SiteBot[ /]([0-9.]{1,10})" => "\\1"
5067 ),
5068 "uri" => "http://www.sitebot.org/robot/"
5069 ),
5070 "siteexplorer" => array(
5071 "icon" => "siteexplorer",
5072 "title" => "SiteExplorer",
5073 "rule" => array(
5074 "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5075 ),
5076 "uri" => "http://siteexplorer.info/"
5077 ),
5078 "sitesell" => array(
5079 "icon" => "sitesell",
5080 "title" => "SiteSell",
5081 "rule" => array(
5082 "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
5083 ),
5084 "uri" => ""
5085 ),
5086 "sitespider" => array(
5087 "icon" => "robot",
5088 "title" => "SiteSpider",
5089 "rule" => array(
5090 "^SiteSpider" => ""
5091 ),
5092 "uri" => ""
5093 ),
5094 "sitesucker" => array(
5095 "icon" => "sitesucker",
5096 "title" => "SiteSucker",
5097 "rule" => array(
5098 "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5099 ),
5100 "uri" => "http://www.sitesucker.us/"
5101 ),
5102 "sitidi" => array(
5103 "icon" => "robot",
5104 "title" => "SitiDi",
5105 "rule" => array(
5106 "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5107 ),
5108 "uri" => ""
5109 ),
5110 "sixy" => array(
5111 "icon" => "robot",
5112 "title" => "Sixy.ch",
5113 "rule" => array(
5114 "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5115 ),
5116 "uri" => "http://sixy.ch"
5117 ),
5118 "skaffe" => array(
5119 "icon" => "robot",
5120 "title" => "Skaffe",
5121 "rule" => array(
5122 "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5123 ),
5124 "uri" => "http://www.skaffe.com"
5125 ),
5126 "skizzle" => array(
5127 "icon" => "skizzle",
5128 "title" => "Skizzle",
5129 "rule" => array(
5130 "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5131 ),
5132 "uri" => "http://www.skizzle.com"
5133 ),
5134 "slider" => array(
5135 "icon" => "robot",
5136 "title" => "Slider",
5137 "rule" => array(
5138 "^Slider[ /]([0-9.]{1,10})" => "\\1"
5139 ),
5140 "uri" => ""
5141 ),
5142 "slugch" => array(
5143 "icon" => "robot",
5144 "title" => "Slugch",
5145 "rule" => array(
5146 "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5147 ),
5148 "uri" => ""
5149 ),
5150 "smartware" => array(
5151 "icon" => "robot",
5152 "title" => "SmartWareSoft",
5153 "rule" => array(
5154 "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5155 ),
5156 "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5157 ),
5158 "snookit" => array(
5159 "icon" => "snookit",
5160 "title" => "Snookit",
5161 "rule" => array(
5162 "^snookit" => ""
5163 ),
5164 "uri" => "http://www.snookit.com/"
5165 ),
5166 "snoopy" => array( // Snoopy user agents
5167 "icon" => "robot",
5168 "title" => "Snoopy",
5169 "rule" => array(
5170 "^Snoopy[^0-9]+([0-9.]{1,10})" => "\\1", // was "^Snoopy.+(...)": the greedy ".+" swallowed all but the last character of the version
5171 "sna-([0-9.]{1,10})" => "\\1" // group 1 = version after "sna-"
5172 ),
5173 "uri" => "http://snoopy.sourceforge.net/"
5174 ),
5175 "snyke" => array(
5176 "icon" => "robot",
5177 "title" => "Snyke",
5178 "rule" => array(
5179 "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5180 ),
5181 "uri" => "http://www.snyke.com"
5182 ),
5183 "socialradar" => array(
5184 "icon" => "socialradar",
5185 "title" => "Social Radar",
5186 "rule" => array(
5187 "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5188 ),
5189 "uri" => "http://infegy.com/"
5190 ),
5191 "soegning" => array(
5192 "icon" => "soegning",
5193 "title" => "Søgning",
5194 "rule" => array(
5195 "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5196 ),
5197 "uri" => ""
5198 ),
5199 "soft411" => array(
5200 "icon" => "soft411",
5201 "title" => "Soft411",
5202 "rule" => array(
5203 "SOFT411 Directory" => ""
5204 ),
5205 "uri" => ""
5206 ),
5207 "sogou" => array(
5208 "icon" => "sogou",
5209 "title" => "Sogou",
5210 "rule" => array(
5211 "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5212 ),
5213 "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5214 ),
5215 "sohu" => array(
5216 "icon" => "robot",
5217 "title" => "Sohu",
5218 "rule" => array(
5219 "sohu[ \-](agent|search)" => ""
5220 ),
5221 "uri" => ""
5222 ),
5223 "somewhere" => array( // agents identifying as Mozilla@somewhere.com
5224 "icon" => "robot",
5225 "title" => "Somewhere.com",
5226 "rule" => array(
5227 "Mozilla\@somewhere\.com" => "" // was "\\1", but the pattern has no capture group to refer to
5228 ),
5229 "uri" => "http://www.somewhere.com/"
5230 ),
5231 "sopheus" => array(
5232 "icon" => "robot",
5233 "title" => "Sopheus",
5234 "rule" => array(
5235 "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5236 ),
5237 "uri" => "http://www.thenetplanet.com"
5238 ),
5239 "soso" => array(
5240 "icon" => "soso",
5241 "title" => "Soso",
5242 "rule" => array(
5243 "^Soso(image)?spider" => ""
5244 ),
5245 "uri" => "http://help.soso.com/soso-image-spider.htm"
5246 ),
5247 "souppot" => array(
5248 "icon" => "robot",
5249 "title" => "SoupPot",
5250 "rule" => array(
5251 "SoupPotBot" => ""
5252 ),
5253 "uri" => ""
5254 ),
5255 "specificmedia" => array(
5256 "icon" => "specificmedia",
5257 "title" => "Specific Media",
5258 "rule" => array(
5259 "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5260 ),
5261 "uri" => ""
5262 ),
5263 "sphider" => array(
5264 "icon" => "sphider",
5265 "title" => "Sphider",
5266 "rule" => array(
5267 "Sphider" => ""
5268 ),
5269 "uri" => "http://www.sphider.eu"
5270 ),
5271 "spinn3r" => array(
5272 "icon" => "robot",
5273 "title" => "Spinn3r",
5274 "rule" => array(
5275 "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5276 ),
5277 "uri" => "http://spinn3r.com/robot"
5278 ),
5279 "sproose" => array(
5280 "icon" => "robot",
5281 "title" => "Sproose",
5282 "rule" => array(
5283 "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5284 ),
5285 "uri" => "http://www.sproose.com/bot.html"
5286 ),
5287 "spurlbot" => array(
5288 "icon" => "robot",
5289 "title" => "SpurlBot",
5290 "rule" => array(
5291 "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5292 ),
5293 "uri" => ""
5294 ),
5295 "stardownloader" => array(
5296 "icon" => "stardownloader",
5297 "title" => "Star Downloader",
5298 "rule" => array(
5299 "^Star Downloader( Pro)?" => ""
5300 ),
5301 "uri" => ""
5302 ),
5303 "steeler" => array(
5304 "icon" => "robot",
5305 "title" => "Steeler",
5306 "rule" => array(
5307 "Steeler[ /]([0-9.]{1,10})" => "\\1"
5308 ),
5309 "uri" => ""
5310 ),
5311 "strategicboard" => array(
5312 "icon" => "strategicboard",
5313 "title" => "Strategic Board",
5314 "rule" => array(
5315 "Strategic Board Bot" => ""
5316 ),
5317 "uri" => "http://www.strategicboard.com"
5318 ),
5319 "suchbaer" => array(
5320 "icon" => "robot",
5321 "title" => "Suchbaer.de",
5322 "rule" => array(
5323 "^suchbaer\.de" => ""
5324 ),
5325 "uri" => "http://www.suchbaer.de/"
5326 ),
5327 "suchbot" => array(
5328 "icon" => "robot",
5329 "title" => "Suchbot",
5330 "rule" => array(
5331 "^suchbot" => ""
5332 ),
5333 "uri" => ""
5334 ),
5335 "suchende" => array(
5336 "icon" => "suchende",
5337 "title" => "Suchen.de",
5338 "rule" => array(
5339 "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5340 "^gonzo/([0-9.]{1,10})" => "\\1"
5341 ),
5342 "uri" => "http://www.suchen.de/"
5343 ),
5344 "suchknecht" => array(
5345 "icon" => "robot",
5346 "title" => "Suchknecht",
5347 "rule" => array(
5348 "^Suchknecht.at-Robot" => ""
5349 ),
5350 "uri" => "http://www.suchknecht.at/"
5351 ),
5352 "suchpad" => array(
5353 "icon" => "robot",
5354 "title" => "Suchpad",
5355 "rule" => array(
5356 "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5357 ),
5358 "uri" => "http://www.suchpad.de"
5359 ),
5360 "sunrise" => array(
5361 "icon" => "sunrise",
5362 "title" => "Sunrise",
5363 "rule" => array(
5364 "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5365 ),
5366 "uri" => ""
5367 ),
5368 "superbot" => array(
5369 "icon" => "superbot",
5370 "title" => "SuperBot",
5371 "rule" => array(
5372 "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5373 ),
5374 "uri" => ""
5375 ),
5376 "surfcontrol" => array(
5377 "icon" => "robot",
5378 "title" => "SurfControl",
5379 "rule" => array(
5380 "SurfControl" => "",
5381 "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5382 ),
5383 "uri" => ""
5384 ),
5385 "surfnet" => array(
5386 "icon" => "robot",
5387 "title" => "SURFnet",
5388 "rule" => array(
5389 "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5390 ),
5391 "uri" => ""
5392 ),
5393 "surfsafely" => array(
5394 "icon" => "robot",
5395 "title" => "Surfsafely",
5396 "rule" => array(
5397 "Submission Spider at surfsafely.com" => ""
5398 ),
5399 "uri" => "http://www.surfsafely.com"
5400 ),
5401 "surphace" => array( // Surphace user agents, including the older "Sphere Scout" name
5402 "icon" => "spherescout",
5403 "title" => "Surphace",
5404 "rule" => array(
5405 "Sphere Scout[^0-9]+([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; was ".+", whose greediness left only the last version character for group 1
5406 "Surphace.+v([0-9.]{1,10})" => "\\1" // group 1 = version following a "v"
5407 ),
5408 "uri" => "http://www.surphace.com"
5409 ),
5410 "surveybot" => array(
5411 "icon" => "surveybot",
5412 "title" => "Whois Survey",
5413 "rule" => array(
5414 "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5415 ),
5416 "uri" => ""
5417 ),
5418 "swoogle" => array(
5419 "icon" => "robot",
5420 "title" => "Swoogle",
5421 "rule" => array(
5422 "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5423 ),
5424 "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5425 ),
5426 "swse" => array(
5427 "icon" => "robot",
5428 "title" => "SWSE",
5429 "rule" => array(
5430 "sw\.deri\.org" => ""
5431 ),
5432 "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5433 ),
5434 "swish-e" => array(
5435 "icon" => "swish-e",
5436 "title" => "Swish-e",
5437 "rule" => array(
5438 "^swish-e" => ""
5439 ),
5440 "uri" => "http://swish-e.org/"
5441 ),
5442 "sygol" => array(
5443 "icon" => "sygol",
5444 "title" => "Sygol",
5445 "rule" => array(
5446 "www.sygol.(com|net)" => ""
5447 ),
5448 "uri" => "http://www.sygol.com"
5449 ),
5450 "syllabs" => array(
5451 "icon" => "syllabs",
5452 "title" => "Syllabs",
5453 "rule" => array(
5454 "Focal[-]([0-9.]{1,10})" => "\\1"
5455 ),
5456 "uri" => "http://www.syllabs.com/crawler.html"
5457 ),
5458 "synapse" => array(
5459 "icon" => "robot",
5460 "title" => "Synapse",
5461 "rule" => array(
5462 " Synapse\)" => ""
5463 ),
5464 "uri" => "http://ws.apache.org/synapse/"
5465 ),
5466 "sync2it" => array(
5467 "icon" => "robot",
5468 "title" => "Sync2it",
5469 "rule" => array(
5470 "^\!Susie" => ""
5471 ),
5472 "uri" => "http://www.sync2it.com/bms/susie.php"
5473 ),
5474 "syncit" => array(
5475 "icon" => "robot",
5476 "title" => "Syncit",
5477 "rule" => array(
5478 "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5479 ),
5480 "uri" => "http://www.syncit.com/"
5481 ),
5482 "syndic8" => array(
5483 "icon" => "syndic8",
5484 "title" => "Syndic8",
5485 "rule" => array(
5486 "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5487 ),
5488 "uri" => "http://www.syndic8.com/"
5489 ),
5490 "syndicatie" => array(
5491 "icon" => "robot",
5492 "title" => "Syndicatie.nl",
5493 "rule" => array(
5494 "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5495 "Syndicatie\.nl robot;" => ""
5496 ),
5497 "uri" => ""
5498 ),
5499 "synomia" => array(
5500 "icon" => "robot",
5501 "title" => "Synomia",
5502 "rule" => array(
5503 "^SynoBot" => ""
5504 ),
5505 "uri" => ""
5506 ),
5507 "synoo" => array(
5508 "icon" => "robot",
5509 "title" => "SynooBot",
5510 "rule" => array(
5511 "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5512 ),
5513 "uri" => ""
5514 ),
5515 "szukacz" => array(
5516 "icon" => "szukacz",
5517 "title" => "Szukacz",
5518 "rule" => array(
5519 "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5520 ),
5521 "uri" => ""
5522 ),
5523 "tagoo" => array(
5524 "icon" => "tagoobot",
5525 "title" => "Tagoo",
5526 "rule" => array(
5527 "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5528 ),
5529 "uri" => "http://www.tagoo.ru"
5530 ),
5531 "tagword" => array(
5532 "icon" => "tagword",
5533 "title" => "Tagword",
5534 "rule" => array(
5535 "^Tagword" => ""
5536 ),
5537 "uri" => "http://tagword.com/dmoz_survey.php"
5538 ),
5539 "trailfire" => array(
5540 "icon" => "trailfire",
5541 "title" => "Trailfire",
5542 "rule" => array(
5543 "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5544 ),
5545 "uri" => "http://trailfire.com"
5546 ),
5547 "tamu" => array(
5548 "icon" => "tamu",
5549 "title" => "Tamu Crawler",
5550 "rule" => array(
5551 "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5552 "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5553 ),
5554 "uri" => "http://irl.cs.tamu.edu/crawler/"
5555 ),
5556 "taptubot" => array(
5557 "icon" => "taptubot",
5558 "title" => "Taptu",
5559 "rule" => array(
5560 "taptubot" => ""
5561 ),
5562 "uri" => "http://www.taptu.com/corp/taptubot"
5563 ),
5564 "targetseek" => array(
5565 "icon" => "robot",
5566 "title" => "TargetSeek",
5567 "rule" => array(
5568 "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5569 ),
5570 "uri" => "http://www.targetgroups.net/TargetSeek.html"
5571 ),
5572 "taw" => array(
5573 "icon" => "taw",
5574 "title" => "TAW",
5575 "rule" => array(
5576 "TAW[ /]([0-9.]{1,10})" => "\\1"
5577 ),
5578 "uri" => "http://www.tawdis.net"
5579 ),
5580 "tcd" => array(
5581 "icon" => "tcd",
5582 "title" => "Trinity College Dublin",
5583 "rule" => array(
5584 "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5585 ),
5586 "uri" => "http://www.tcd.ie"
5587 ),
5588 "technorati" => array(
5589 "icon" => "technorati",
5590 "title" => "Technorati",
5591 "rule" => array(
5592 "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5593 ),
5594 "uri" => ""
5595 ),
5596 "teleport" => array(
5597 "icon" => "teleport",
5598 "title" => "Teleport",
5599 "rule" => array(
5600 "Teleport[ \-]?Pro" => ""
5601 ),
5602 "uri" => ""
5603 ),
5604 "terrar" => array(
5605 "icon" => "robot",
5606 "title" => "Terrar",
5607 "rule" => array(
5608 "^Fresh Search :: Terrar" => ""
5609 ),
5610 "uri" => ""
5611 ),
5612 "theophrastus" => array(
5613 "icon" => "robot",
5614 "title" => "Theophrastus",
5615 "rule" => array(
5616 "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5617 ),
5618 "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5619 ),
5620 "thumbnailscz" => array(
5621 "icon" => "robot",
5622 "title" => "Thumbnails.cz",
5623 "rule" => array(
5624 "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5625 ),
5626 "uri" => ""
5627 ),
5628 "thumbshot" => array( // Thumbshots robot entry
5629 "icon" => "robot",
5630 "title" => "Thumbshots",
5631 "rule" => array( // pattern => backreference naming the capture group that holds the version ("" when none is captured)
5632 "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is only the "Version: " / "v" prefix; the version number is group 2
5633 "^thumbshots-de" => ""
5634 ),
5635 "uri" => "http://www.thumbshots.de"
5636 ),
5637 "thunderstone" => array(
5638 "icon" => "thunderstone",
5639 "title" => "Thunderstone",
5640 "rule" => array(
5641 "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5642 "search.thunderstone.com" => ""
5643 ),
5644 "uri" => "http://search.thunderstone.com/"
5645 ),
5646 "timbobot" => array(
5647 "icon" => "robot",
5648 "title" => "TimboBot",
5649 "rule" => array(
5650 "timboBot" => ""
5651 ),
5652 "uri" => ""
5653 ),
5654 "topsy" => array(
5655 "icon" => "topsy",
5656 "title" => "Topsy",
5657 "rule" => array(
5658 "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5659 ),
5660 "uri" => "http://labs.topsy.com/butterfly.html"
5661 ),
5662 "trayce" => array(
5663 "icon" => "robot",
5664 "title" => "Trayce",
5665 "rule" => array(
5666 "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5667 ),
5668 "uri" => ""
5669 ),
5670 "tricus" => array(
5671 "icon" => "robot",
5672 "title" => "Tricus",
5673 "rule" => array(
5674 "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5675 ),
5676 "uri" => ""
5677 ),
5678 "topicblogs" => array(
5679 "icon" => "robot",
5680 "title" => "Topicblogs",
5681 "rule" => array(
5682 "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5683 ),
5684 "uri" => ""
5685 ),
5686 "touche" => array(
5687 "icon" => "touche",
5688 "title" => "Touché",
5689 "rule" => array(
5690 "^Touche" => ""
5691 ),
5692 "uri" => "http://touche.com.ve"
5693 ),
5694 "tuezilla" => array( // Tuezilla robot entry
5695 "icon" => "robot",
5696 "title" => "TÜzilla", // was double-encoded ("Ã" + "œ" are the UTF-8 bytes of "Ü" misread as a single-byte charset)
5697 "rule" => array(
5698 "tuezilla.de" => "" // no capture group, so no version is reported
5699 ),
5700 "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5701 ),
5702 "turnitin" => array(
5703 "icon" => "turnitin",
5704 "title" => "Turnitin",
5705 "rule" => array(
5706 "TurnitinBot[ /]([0-9.]{1,10})" => "\\1",
5707 "^Turnitin" => ""
5708 ),
5709 "uri" => ""
5710 ),
5711 "tutorgig" => array(
5712 "icon" => "robot",
5713 "title" => "TutorGig",
5714 "rule" => array(
5715 "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5716 ),
5717 "uri" => ""
5718 ),
5719 "twiceler" => array(
5720 "icon" => "cuill",
5721 "title" => "Cuill",
5722 "rule" => array(
5723 "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5724 "Twiceler" => ""
5725 ),
5726 "uri" => "http://www.cuill.com/twiceler/robot.html"
5727 ),
5728 "twingly" => array(
5729 "icon" => "twingly",
5730 "title" => "Twingly",
5731 "rule" => array(
5732 "Twingly Recon" => ""
5733 ),
5734 "uri" => "http://www.twingly.com/"
5735 ),
5736 "twitter" => array(
5737 "icon" => "twitter",
5738 "title" => "Twitter",
5739 "rule" => array(
5740 "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5741 ),
5742 "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5743 ),
5744 "typepad" => array(
5745 "icon" => "typepad",
5746 "title" => "TypePad",
5747 "rule" => array(
5748 "TypePad/([0-9a-z.]{1,10})" => "\\1"
5749 ),
5750 "uri" => ""
5751 ),
5752 "udmsearch" => array(
5753 "icon" => "robot",
5754 "title" => "UdmSearch",
5755 "rule" => array(
5756 "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5757 ),
5758 "uri" => ""
5759 ),
5760 "ukwizz" => array(
5761 "icon" => "ukwizz",
5762 "title" => "UKWizz",
5763 "rule" => array(
5764 "^Mackster.*ukwizz" => ""
5765 ),
5766 "uri" => "http://www.ukwizz.com"
5767 ),
5768 "ultraseek" => array(
5769 "icon" => "robot",
5770 "title" => "Ultraseek",
5771 "rule" => array(
5772 "Ultraseek" => ""
5773 ),
5774 "uri" => ""
5775 ),
5776 "ultraspider" => array(
5777 "icon" => "robot",
5778 "title" => "UltraSpider",
5779 "rule" => array(
5780 "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5781 ),
5782 "uri" => "http://www.search.ch"
5783 ),
5784 "umai" => array(
5785 "icon" => "robot",
5786 "title" => "Umai",
5787 "rule" => array(
5788 "umai[/ ]([0-9.]{1,10})" => "\\1"
5789 ),
5790 "uri" => ""
5791 ),
5792 "unchaos" => array(
5793 "icon" => "robot",
5794 "title" => "Unchaos",
5795 "rule" => array(
5796 "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5797 "unchaos" => ""
5798 ),
5799 "uri" => ""
5800 ),
5801 "unido" => array( // UNIdo robot entry
5802 "icon" => "robot",
5803 "title" => "UNIdo",
5804 "rule" => array( // pattern => backreference naming the capture group that holds the version ("" when none is captured)
5805 "^unido-bot" => "" // the pattern has no capture group, so "\\1" referenced nothing; use the empty value like other version-less rules
5806 ),
5807 "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5808 ),
5809 "updated" => array(
5810 "icon" => "robot",
5811 "title" => "Updated",
5812 "rule" => array(
5813 "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5814 ),
5815 "uri" => ""
5816 ),
5817 "uptimebot" => array(
5818 "icon" => "robot",
5819 "title" => "UptimeBot",
5820 "rule" => array(
5821 "^UptimeBot" => ""
5822 ),
5823 "uri" => "http://www.uptimebot.com/"
5824 ),
5825 "urifetch" => array(
5826 "icon" => "robot",
5827 "title" => "URI::Fetch",
5828 "rule" => array(
5829 "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5830 ),
5831 "uri" => ""
5832 ),
5833 "urlbase" => array(
5834 "icon" => "robot",
5835 "title" => "URLBase",
5836 "rule" => array(
5837 "URLBase[ /]([0-9.]{1,10})" => "\\1"
5838 ),
5839 "uri" => ""
5840 ),
5841 "urlblaze" => array(
5842 "icon" => "robot",
5843 "title" => "URLBlaze",
5844 "rule" => array(
5845 "^URLBlaze" => ""
5846 ),
5847 "uri" => ""
5848 ),
5849 "urlcontr" => array(
5850 "icon" => "robot",
5851 "title" => "MS URL Control",
5852 "rule" => array(
5853 "Microsoft URL[ \-]?Control" => ""
5854 ),
5855 "uri" => ""
5856 ),
5857 "urlgetfile" => array(
5858 "icon" => "robot",
5859 "title" => "URLGetFile",
5860 "rule" => array(
5861 "^URLGetFile" => ""
5862 ),
5863 "uri" => ""
5864 ),
5865 "urlscope" => array(
5866 "icon" => "robot",
5867 "title" => "UrlScope",
5868 "rule" => array(
5869 "UrlScope" => ""
5870 ),
5871 "uri" => ""
5872 ),
5873 "urltrends" => array(
5874 "icon" => "urltrends",
5875 "title" => "UrlTrends",
5876 "rule" => array(
5877 "Snappy/([0-9.]{1,10})" => "\\1",
5878 ),
5879 "uri" => ""
5880 ),
5881 "usww" => array(
5882 "icon" => "usww",
5883 "title" => "USWW",
5884 "rule" => array(
5885 "usww\.com" => "",
5886 "Mozilla/5\.0 URL-Spider" => ""
5887 ),
5888 "uri" => "http://www.usww.com/"
5889 ),
5890 "usyd" => array(
5891 "icon" => "robot",
5892 "title" => "USyd-NLP-Spider",
5893 "rule" => array(
5894 "^USyd-NLP-Spider" => ""
5895 ),
5896 "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5897 ),
5898 "vagabondo" => array(
5899 "icon" => "wiseguys",
5900 "title" => "WiseGuys",
5901 "rule" => array(
5902 "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5903 "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5904 ),
5905 "uri" => ""
5906 ),
5907 "unicorn" => array(
5908 "icon" => "w3c",
5909 "title" => "W3C Unicorn",
5910 "rule" => array(
5911 "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5912 ),
5913 "uri" => "http://validator.w3.org/unicorn/"
5914 ),
5915 "validator" => array(
5916 "icon" => "w3c",
5917 "title" => "W3C Validator",
5918 "rule" => array(
5919 "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5920 ),
5921 "uri" => "http://validator.w3.org/"
5922 ),
5923 "validator.nu" => array( // Validator.nu robot entry
5924 "icon" => "validatornu",
5925 "title" => "Validator.nu",
5926 "rule" => array( // pattern => backreference naming the capture group that holds the version ("" when none is captured)
5927 "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5928 "^Validator.nu/LV" => "" // the "LV" variant has no capture group, so "\\1" referenced nothing
5929 ),
5930 "uri" => "http://validator.nu/"
5931 ),
5932 "validome" => array( // Validome robot entry
5933 "icon" => "validome",
5934 "title" => "Validome",
5935 "rule" => array( // pattern => backreference naming the capture group that holds the version ("" when none is captured)
5936 "web-validator[ /]([0-9.]{1,10})" => "\\1",
5937 "web-validator" => "" // version-less fallback: no capture group, so "\\1" referenced nothing
5938 ),
5939 "uri" => "https://validome.org/"
5940 ),
5941 "verity" => array(
5942 "icon" => "robot",
5943 "title" => "Verity",
5944 "rule" => array(
5945 "^vspider[ /]([0-9.]{1,10})" => "\\1",
5946 "^vspider" => ""
5947 ),
5948 "uri" => "http://www.verity.com/"
5949 ),
5950 "versionsproject" => array(
5951 "icon" => "robot",
5952 "title" => "Versions-project",
5953 "rule" => array(
5954 "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5955 ),
5956 "uri" => "http://www.versions-project.org/"
5957 ),
5958 "verticalmatch" => array(
5959 "icon" => "robot",
5960 "title" => "VerticalMatch",
5961 "rule" => array(
5962 "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5963 ),
5964 "uri" => "http://www.VerticalMatch.com/"
5965 ),
5966 "verzamelgids" => array(
5967 "icon" => "robot",
5968 "title" => "Verzamelgids",
5969 "rule" => array(
5970 "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5971 ),
5972 "uri" => "http://www.verzamelgids.nl/"
5973 ),
5974 "vestris" => array(
5975 "icon" => "vestris",
5976 "title" => "Vestris",
5977 "rule" => array(
5978 "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5979 ),
5980 "uri" => "http://alkaline.vestris.com/"
5981 ),
5982 "vindex" => array(
5983 "icon" => "vindex",
5984 "title" => "Vindex",
5985 "rule" => array(
5986 "Vindex[ /]([0-9.]{1,10})" => "\\1"
5987 ),
5988 "uri" => ""
5989 ),
5990 "visvo" => array(
5991 "icon" => "robot",
5992 "title" => "Visvo",
5993 "rule" => array(
5994 "VisBot[ /]([0-9.]{1,10})" => "\\1"
5995 ),
5996 "uri" => "http://www.visvo.com"
5997 ),
5998 "voila" => array(
5999 "icon" => "voila",
6000 "title" => "Voila",
6001 "rule" => array(
6002 "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
6003 "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
6004 ),
6005 "uri" => ""
6006 ),
6007 "vonna" => array(
6008 "icon" => "robot",
6009 "title" => "Vonna",
6010 "rule" => array(
6011 "Vonna.com b o t" => ""
6012 ),
6013 "uri" => ""
6014 ),
6015 "vortex" => array(
6016 "icon" => "robot",
6017 "title" => "Vortex",
6018 "rule" => array(
6019 "Vortex[ /]([0-9.]{1,10})" => "\\1"
6020 ),
6021 "uri" => "http://marty.anstey.ca/robots/vortex/"
6022 ),
6023 "w3sitesearch" => array(
6024 "icon" => "w3sitesearch",
6025 "title" => "W3SiteSearch",
6026 "rule" => array(
6027 "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
6028 ),
6029 "uri" => "http://www.w3sitesearch.de"
6030 ),
6031 "wagger" => array(
6032 "icon" => "robot",
6033 "title" => "Wagger",
6034 "rule" => array(
6035 "^Waggr" => ""
6036 ),
6037 "uri" => "http://www.waggr.com/"
6038 ),
6039 "wanadoo" => array(
6040 "icon" => "robot",
6041 "title" => "Wanadoo",
6042 "rule" => array(
6043 "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
6044 ),
6045 "uri" => "http://www.wanadoo.fr/"
6046 ),
6047 "wapalizer" => array(
6048 "icon" => "robot",
6049 "title" => "Wapalizer",
6050 "rule" => array(
6051 "wapalizer[ /]([0-9.]{1,10})" => "\\1"
6052 ),
6053 "uri" => "http://www.wapdrive.com/"
6054 ),
6055 "watson" => array(
6056 "icon" => "addy",
6057 "title" => "Dr.Watson",
6058 "rule" => array(
6059 "Watson[ /]([0-9.]{1,10})" => "\\1",
6060 "watson\.addy\.com" => ""
6061 ),
6062 "uri" => ""
6063 ),
6064 "wavefire" => array(
6065 "icon" => "robot",
6066 "title" => "Wavefire",
6067 "rule" => array(
6068 "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
6069 ),
6070 "uri" => ""
6071 ),
6072 "waypath" => array(
6073 "icon" => "waypath",
6074 "title" => "Waypath",
6075 "rule" => array(
6076 "Waypath[ \-]?Scout" => "",
6077 "Waypath (development )?crawler" => ""
6078 ),
6079 "uri" => ""
6080 ),
6081 "wauuu" => array( // Wauuu robot entry
6082 "icon" => "wauuu",
6083 "title" => "Wauuu",
6084 "rule" => array( // pattern => backreference naming the capture group that holds the version
6085 "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the pattern has a single capture group; "\\2" pointed at a group that does not exist
6086 ),
6087 "uri" => "http://www.wauuu.com"
6088 ),
6089 "wdg" => array(
6090 "icon" => "wdg",
6091 "title" => "WDG Validator",
6092 "rule" => array(
6093 "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6094 ),
6095 "uri" => "http://www.htmlhelp.com/tools/validator/"
6096 ),
6097 "webagogo" => array(
6098 "icon" => "webagogo",
6099 "title" => "Webagogo",
6100 "rule" => array(
6101 "^Webagogo" => ""
6102 ),
6103 "uri" => "http://www.webagogo.be/"
6104 ),
6105 "webalta" => array(
6106 "icon" => "webalta",
6107 "title" => "WebAlta",
6108 "rule" => array(
6109 "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6110 ),
6111 "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6112 ),
6113 "webdigity" => array(
6114 "icon" => "robot",
6115 "title" => "Webdigity Whois Service",
6116 "rule" => array(
6117 "^webdigity whois service" => ""
6118 ),
6119 "uri" => "http://www.webdigity.com/ws"
6120 ),
6121 "webelixir" => array(
6122 "icon" => "webelixir",
6123 "title" => "Webelixir",
6124 "rule" => array(
6125 "^webelixir" => ""
6126 ),
6127 "uri" => "http://www.webelixir.net/"
6128 ),
6129 "webbotru" => array(
6130 "icon" => "robot",
6131 "title" => "Webbot.ru",
6132 "rule" => array(
6133 " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6134 ),
6135 "uri" => "http://www.webbot.ru/bot.html"
6136 ),
6137 "webcapture" => array(
6138 "icon" => "robot",
6139 "title" => "WebCapture",
6140 "rule" => array(
6141 "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6142 ),
6143 "uri" => ""
6144 ),
6145 "webcollage" => array(
6146 "icon" => "robot",
6147 "title" => "Webcollage",
6148 "rule" => array(
6149 "webcollage" => ""
6150 ),
6151 "uri" => ""
6152 ),
6153 "webcopier" => array(
6154 "icon" => "webcopier",
6155 "title" => "WebCopier",
6156 "rule" => array(
6157 "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6158 ),
6159 "uri" => ""
6160 ),
6161 "webcorp" => array(
6162 "icon" => "webcorp",
6163 "title" => "WebCorp",
6164 "rule" => array(
6165 "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6166 ),
6167 "uri" => "http://www.webcorp.org.uk/"
6168 ),
6169 "webcrawl" => array(
6170 "icon" => "robot",
6171 "title" => "WebCrawl",
6172 "rule" => array(
6173 "webcrawl\.net" => ""
6174 ),
6175 "uri" => ""
6176 ),
6177 "webdownloader" => array(
6178 "icon" => "robot",
6179 "title" => "Web Downloader",
6180 "rule" => array(
6181 "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6182 ),
6183 "uri" => ""
6184 ),
6185 "webfetch" => array(
6186 "icon" => "robot",
6187 "title" => "WebFetch",
6188 "rule" => array(
6189 "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6190 ),
6191 "uri" => ""
6192 ),
6193 "webfind" => array(
6194 "icon" => "robot",
6195 "title" => "WebFind",
6196 "rule" => array(
6197 "^WebFindBot" => ""
6198 ),
6199 "uri" => "http://www.web-find.com"
6200 ),
6201 "webglimpse" => array(
6202 "icon" => "robot",
6203 "title" => "Webglimpse",
6204 "rule" => array(
6205 "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6206 ),
6207 "uri" => "http://webglimpse.net"
6208 ),
6209 "webgobbler" => array(
6210 "icon" => "robot",
6211 "title" => "webGobbler",
6212 "rule" => array(
6213 "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6214 ),
6215 "uri" => ""
6216 ),
6217 "webimages" => array(
6218 "icon" => "webimages",
6219 "title" => "WebImages",
6220 "rule" => array(
6221 "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6222 ),
6223 "uri" => "http://herbert.groot.jebbink.nl/"
6224 ),
6225 "weblight" => array(
6226 "icon" => "robot",
6227 "title" => "WebLight",
6228 "rule" => array(
6229 "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6230 ),
6231 "uri" => "http://www.illumit.com/Products/weblight/"
6232 ),
6233 "weblinks" => array(
6234 "icon" => "robot",
6235 "title" => "WebLink's",
6236 "rule" => array(
6237 "^Weblink.s checker" => ""
6238 ),
6239 "uri" => ""
6240 ),
6241 "webmeasurement" => array(
6242 "icon" => "robot",
6243 "title" => "Webmeasurement",
6244 "rule" => array(
6245 "^webmeasurement-bot" => ""
6246 ),
6247 "uri" => "http://rvs.informatik.uni-leipzig.de"
6248 ),
6249 "webminer" => array(
6250 "icon" => "robot",
6251 "title" => "WebMiner",
6252 "rule" => array(
6253 "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6254 ),
6255 "uri" => ""
6256 ),
6257 "webmin" => array(
6258 "icon" => "webmin",
6259 "title" => "Webmin",
6260 "rule" => array(
6261 "^webmin" => ""
6262 ),
6263 "uri" => ""
6264 ),
6265 "webmon" => array(
6266 "icon" => "webmon",
6267 "title" => "Webmon",
6268 "rule" => array(
6269 "WebMon[ /]([0-9.]{1,10})" => "\\1"
6270 ),
6271 "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6272 ),
6273 "webox" => array(
6274 "icon" => "robot",
6275 "title" => " WeBoX",
6276 "rule" => array(
6277 "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6278 ),
6279 "uri" => ""
6280 ),
6281 "webpatrol" => array(
6282 "icon" => "webpatrol",
6283 "title" => "WebPatrol",
6284 "rule" => array(
6285 "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6286 ),
6287 "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6288 ),
6289 "webpix" => array(
6290 "icon" => "webpix",
6291 "title" => "WebPix",
6292 "rule" => array(
6293 "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6294 ),
6295 "uri" => ""
6296 ),
6297 "webrace" => array(
6298 "icon" => "robot",
6299 "title" => "WebRACE",
6300 "rule" => array(
6301 "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6302 ),
6303 "uri" => ""
6304 ),
6305 "webreaper" => array(
6306 "icon" => "webreaper",
6307 "title" => "WebReaper",
6308 "rule" => array(
6309 "^WebReaper " => ""
6310 ),
6311 "uri" => "http://www.webreaper.net/"
6312 ),
6313 "webresult" => array(
6314 "icon" => "robot",
6315 "title" => "Webresult",
6316 "rule" => array(
6317 "Der webresult\.de Robot" => ""
6318 ),
6319 "uri" => ""
6320 ),
6321 "webring" => array(
6322 "icon" => "robot",
6323 "title" => "Webring Checker",
6324 "rule" => array(
6325 "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6326 ),
6327 "uri" => ""
6328 ),
6329 "webripper" => array(
6330 "icon" => "webripper",
6331 "title" => "WebRipper",
6332 "rule" => array(
6333 "^WebRipper" => ""
6334 ),
6335 "uri" => "http://calluna-software.com"
6336 ),
6337 "webscaled" => array(
6338 "icon" => "webscaled",
6339 "title" => "Webscaled",
6340 "rule" => array(
6341 "Swarm" => ""
6342 ),
6343 "uri" => "http://webscaled.com/"
6344 ),
6345 "websearchau" => array(
6346 "icon" => "websearchau",
6347 "title" => "WebSearch.COM.AU",
6348 "rule" => array(
6349 "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6350 ),
6351 "uri" => "http://WebSearch.com.au/"
6352 ),
6353 "websearchbench" => array(
6354 "icon" => "robot",
6355 "title" => "WebSearchBench",
6356 "rule" => array(
6357 "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6358 ),
6359 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6360 ),
6361 "websense" => array(
6362 "icon" => "websense",
6363 "title" => "Websense",
6364 "rule" => array(
6365 "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6366 ),
6367 "uri" => ""
6368 ),
6369 "websiteshadow" => array(
6370 "icon" => "websiteshadow",
6371 "title" => "Websiteshadow",
6372 "rule" => array(
6373 "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6374 ),
6375 "uri" => "http://websiteshadow.com"
6376 ),
6377 "websiteworth" => array(
6378 "icon" => "robot",
6379 "title" => "WebsiteWorth",
6380 "rule" => array(
6381 "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6382 ),
6383 "uri" => "http://directory.sootle.com/website-worth/tata.php"
6384 ),
6385 "websquash" => array(
6386 "icon" => "websquash",
6387 "title" => "Websquash",
6388 "rule" => array(
6389 "webs(quash\.com|ite[ \-]?Monitor)" => ""
6390 ),
6391 "uri" => ""
6392 ),
6393 "webstripper" => array(
6394 "icon" => "robot",
6395 "title" => "WebStripper",
6396 "rule" => array(
6397 "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6398 ),
6399 "uri" => ""
6400 ),
6401 "webzip" => array(
6402 "icon" => "webzip",
6403 "title" => "WebZIP",
6404 "rule" => array(
6405 "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6406 ),
6407 "uri" => ""
6408 ),
6409 "wep" => array(
6410 "icon" => "robot",
6411 "title" => "WEP Search",
6412 "rule" => array(
6413 "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6414 ),
6415 "uri" => ""
6416 ),
6417 "westwind" => array(
6418 "icon" => "robot",
6419 "title" => "West Wind Internet Protocols",
6420 "rule" => array(
6421 "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6422 ),
6423 "uri" => "http://www.west-wind.com/wwipstuff.asp"
6424 ),
6425 "wget" => array(
6426 "icon" => "wget",
6427 "title" => "Wget",
6428 "rule" => array(
6429 "Wget[ /]([0-9.]{1,10})" => "\\1",
6430 "Wget" => ""
6431 ),
6432 "uri" => ""
6433 ),
6434 "whizbang" => array(
6435 "icon" => "whizbang",
6436 "title" => "WhizBang",
6437 "rule" => array(
6438 "WhizBang" => ""
6439 ),
6440 "uri" => "http://www.whizbang.com/crawler/"
6441 ),
6442 "whois" => array(
6443 "icon" => "whois",
6444 "title" => "Who.is",
6445 "rule" => array(
6446 "Who.is Bot" => ""
6447 ),
6448 "uri" => "http://www.who.is/"
6449 ),
6450 "wikiwix" => array(
6451 "icon" => "wikiwix",
6452 "title" => "Wikiwix",
6453 "rule" => array(
6454 "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6455 ),
6456 "uri" => "http://www.wikiwix.com/"
6457 ),
6458 "wingflyer" => array(
6459 "icon" => "robot",
6460 "title" => "WingFlyer",
6461 "rule" => array(
6462 "^WebFetch" => ""
6463 ),
6464 "uri" => "http://www.wingflyer.com/"
6465 ),
6466 "wininet" => array(
6467 "icon" => "robot",
6468 "title" => "WinInet",
6469 "rule" => array(
6470 "TeamSoft WinInet Component" => ""
6471 ),
6472 "uri" => "http://www.winsoft.sk/wininet.htm"
6473 ),
6474 "winhttp" => array(
6475 "icon" => "robot",
6476 "title" => "WinHTTP",
6477 "rule" => array(
6478 "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6479 ),
6480 "uri" => ""
6481 ),
6482 "wire" => array(
6483 "icon" => "robot",
6484 "title" => "WIRE",
6485 "rule" => array(
6486 "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6487 ),
6488 "uri" => ""
6489 ),
6490 "wmp" => array(
6491 "icon" => "robot",
6492 "title" => "WMP",
6493 "rule" => array(
6494 "^WMP" => ""
6495 ),
6496 "uri" => ""
6497 ),
6498 "woozweb" => array(
6499 "icon" => "woozweb",
6500 "title" => "Woozweb",
6501 "rule" => array(
6502 "woozweb" => ""
6503 ),
6504 "uri" => "http://www.woozweb.com/"
6505 ),
6506 "wordchamp" => array(
6507 "icon" => "robot",
6508 "title" => "WordChamp",
6509 "rule" => array(
6510 "^WordChampBot" => ""
6511 ),
6512 "uri" => "http://www.wordchamp.com/"
6513 ),
6514 "wordpress" => array(
6515 "icon" => "wordpress",
6516 "title" => "WordPress",
6517 "rule" => array(
6518 "WordPress[ /]([0-9.]{1,10})" => "\\1"
6519 ),
6520 "uri" => ""
6521 ),
6522 "worio" => array(
6523 "icon" => "worio",
6524 "title" => "Worio",
6525 "rule" => array(
6526 "woriobot" => ""
6527 ),
6528 "uri" => "http://worio.com/"
6529 ),
6530 "worldlight" => array(
6531 "icon" => "worldlight",
6532 "title" => "WorldLight",
6533 "rule" => array(
6534 "^WorldLight" => ""
6535 ),
6536 "uri" => ""
6537 ),
6538 "worqmada" => array(
6539 "icon" => "robot",
6540 "title" => "WorQmada",
6541 "rule" => array(
6542 "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6543 ),
6544 "uri" => ""
6545 ),
6546 "wotbox" => array(
6547 "icon" => "wotbox",
6548 "title" => "Wotbox",
6549 "rule" => array(
6550 "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6551 ),
6552 "uri" => ""
6553 ),
6554 "wp" => array(
6555 "icon" => "wp",
6556 "title" => "Wirtualna Polska",
6557 "rule" => array(
6558 "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6559 ),
6560 "uri" => "http://wp.pl"
6561 ),
6562 "wsb" => array(
6563 "icon" => "robot",
6564 "title" => "WebSearchBench",
6565 "rule" => array(
6566 "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6567 "WSB " => ""
6568 ),
6569 "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6570 ),
6571 "wume" => array(
6572 "icon" => "robot",
6573 "title" => "WUME Lab's",
6574 "rule" => array(
6575 "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6576 ),
6577 "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6578 ),
6579 "wusage" => array(
6580 "icon" => "wusage",
6581 "title" => "Wusage",
6582 "rule" => array(
6583 "Wusage[ /]([0-9.]{1,10})" => "\\1",
6584 ),
6585 "uri" => "http://www.boutell.com/wusage/"
6586 ),
6587 "wwgrapevine" => array(
6588 "icon" => "wwgrapevine",
6589 "title" => "WWgrapevine",
6590 "rule" => array(
6591 "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6592 ),
6593 "uri" => ""
6594 ),
6595 "wws" => array(
6596 "icon" => "robot",
6597 "title" => "WWSBOT",
6598 "rule" => array(
6599 "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6600 ),
6601 "uri" => "http://www.analyzer.nu"
6602 ),
6603 "www4mail" => array(
6604 "icon" => "robot",
6605 "title" => "WWW4mail",
6606 "rule" => array(
6607 "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6608 ),
6609 "uri" => "http://www.www4mail.org/"
6610 ),
6611 "wwwc" => array(
6612 "icon" => "wwwc",
6613 "title" => "WWWC",
6614 "rule" => array(
6615 "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6616 ),
6617 "uri" => ""
6618 ),
6619 "wwwd" => array(
6620 "icon" => "robot",
6621 "title" => "WWWD",
6622 "rule" => array(
6623 "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6624 ),
6625 "uri" => ""
6626 ),
6627 "wwweasel" => array(
6628 "icon" => "wwweasel",
6629 "title" => "WWWeasel",
6630 "rule" => array(
6631 "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6632 ),
6633 "uri" => ""
6634 ),
6635 "wwwfi" => array(
6636 "icon" => "wwwfi",
6637 "title" => "www.fi",
6638 "rule" => array(
6639 "www\.fi crawler" => ""
6640 ),
6641 "uri" => "http://www.fi/"
6642 ),
6643 "wwwmechanize" => array(
6644 "icon" => "robot",
6645 "title" => "WWW-Mechanize",
6646 "rule" => array(
6647 "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6648 ),
6649 "uri" => ""
6650 ),
6651 "wwwoffle" => array(
6652 "icon" => "robot",
6653 "title" => "WWWoffle",
6654 "rule" => array(
6655 "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6656 ),
6657 "uri" => ""
6658 ),
6659 "wwwster" => array(
6660 "icon" => "robot",
6661 "title" => "WWWster",
6662 "rule" => array(
6663 "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6664 ),
6665 "uri" => ""
6666 ),
6667 "wysigot" => array(
6668 "icon" => "wysigot",
6669 "title" => "Wysigot",
6670 "rule" => array(
6671 "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6672 ),
6673 "uri" => ""
6674 ),
6675 "xaldon" => array(
6676 "icon" => "xaldon",
6677 "title" => "Xaldon",
6678 "rule" => array(
6679 "Xaldon WebSpider" => ""
6680 ),
6681 "uri" => "http://www.xaldon.de/"
6682 ),
6683 "xenu" => array( // Xenu Link Sleuth robot entry
6684 "icon" => "xenu",
6685 "title" => "Xenu Link Sleuth",
6686 "rule" => array( // pattern => backreference naming the capture group that holds the version
6687 "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6688 "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional escaped "'s"; the version is group 2
6689 "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6690 ),
6691 "uri" => "http://home.snafu.de/tilman/xenulink.html"
6692 ),
6693 "xerka" => array(
6694 "icon" => "xerka",
6695 "title" => "Xerka",
6696 "rule" => array(
6697 "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6698 ),
6699 "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6700 ),
6701 "xirq" => array(
6702 "icon" => "robot",
6703 "title" => "XIRQ",
6704 "rule" => array(
6705 "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6706 ),
6707 "uri" => "http://www.xirq.com"
6708 ),
6709 "xmlslurp" => array(
6710 "icon" => "robot",
6711 "title" => "XMLSlurp",
6712 "rule" => array(
6713 "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6714 ),
6715 "uri" => ""
6716 ),
6717 "xml-sitemaps" => array(
6718 "icon" => "xml-sitemaps",
6719 "title" => "XML-Sitemaps",
6720 "rule" => array(
6721 "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6722 ),
6723 "uri" => ""
6724 ),
6725 "xmlrpc" => array(
6726 "icon" => "robot",
6727 "title" => "Trackback",
6728 "rule" => array(
6729 "XMLRPC" => ""
6730 ),
6731 "uri" => ""
6732 ),
6733 "xovi" => array(
6734 "icon" => "xovi",
6735 "title" => "Xovi",
6736 "rule" => array(
6737 "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6738 ),
6739 "uri" => "http://www.xovibot.net"
6740 ),
6741 "yacy" => array(
6742 "icon" => "yacy",
6743 "title" => "Yacy",
6744 "rule" => array(
6745 "yacy\.net" => ""
6746 ),
6747 "uri" => ""
6748 ),
6749 "yahoo" => array( // Yahoo crawlers (Slurp, MMCrawler, VerticalCrawler, Y!J / Yahoo Japan, ...)
6750 "icon" => "yahoo",
6751 "title" => "Yahoo",
6752 "rule" => array( // pattern => version back-reference; specific (versioned) patterns are listed before the generic one
6753 "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6754 "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6755 "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "", // also matches every other "Yahoo-..." agent, so it has to follow the two versioned rules above. NOTE(review): assumes the first matching rule wins - confirm against the matching loop
6756 "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6757 "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6758 "Y!OASIS/TEST" => "",
6759 "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6760 "Y!J; for robot study" => "",
6761 "Yahoo Japan; for robot study" => ""
6762 ),
6763 "uri" => "http://www.yahoo.com"
6764 ),
6765 "yahoo-feed" => array(
6766 "icon" => "yahoo",
6767 "title" => "Yahoo Feedseeker",
6768 "rule" => array(
6769 "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6770 ),
6771 "uri" => "http://www.yahoo.com"
6772 ),
6773 "yandex" => array(
6774 "icon" => "yandex",
6775 "title" => "Yandex",
6776 "rule" => array(
6777 "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6778 "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6779 ),
6780 "uri" => "http://yandex.com/bots"
6781 ),
6782 "yanga" => array(
6783 "icon" => "yanga",
6784 "title" => "Yanga",
6785 "rule" => array (
6786 "^Yanga.*v([0-9.]{1,10})" => "\\1"
6787 ),
6788 "uri" => "http://www.yanga.co.uk/"
6789 ),
6790 "yap" => array(
6791 "icon" => "yap",
6792 "title" => "Yap",
6793 "rule" => array(
6794 "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6795 ),
6796 "uri" => "http://www.yapinc.com/"
6797 ),
6798 "yarienavoir" => array(
6799 "icon" => "robot",
6800 "title" => "Yarienavoir",
6801 "rule" => array(
6802 "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6803 ),
6804 "uri" => "http://www.yarienavoir.net/"
6805 ),
6806 "yell" => array(
6807 "icon" => "yell",
6808 "title" => "Yell",
6809 "rule" => array(
6810 "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6811 "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6812 ),
6813 "uri" => ""
6814 ),
6815 "youdao" => array( // Youdao crawlers (both the "YodaoBot" and "YoudaoBot" spellings)
6816 "icon" => "youdao",
6817 "title" => "Youdao",
6818 "rule" => array(
6819 "YodaoBot(-(Image|Mobile)?)?[ /]([0-9.]{1,10})" => "\\3", // the "-Image"/"-Mobile" suffix is optional as a whole, so plain "YodaoBot/1.0" matches too; group 3 is the version
6820 "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6821 ),
6822 "uri" => "http://www.youdao.com/help/webmaster/spider/"
6823 ),
6824 "yoogli" => array(
6825 "icon" => "yoogli",
6826 "title" => "Yoogli",
6827 "rule" => array(
6828 "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6829 ),
6830 "uri" => "http://www.yoogli.com"
6831 ),
6832 "yotta" => array(
6833 "icon" => "robot",
6834 "title" => "Yotta",
6835 "rule" => array(
6836 "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6837 "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6838 ),
6839 "uri" => "http://www.yottacars.com"
6840 ),
6841 "yoono" => array(
6842 "icon" => "yoono",
6843 "title" => "Yoono",
6844 "rule" => array(
6845 "Yoono" => ""
6846 ),
6847 "uri" => "http://www.yoono.com/"
6848 ),
6849 "yowedo" => array(
6850 "icon" => "robot",
6851 "title" => "Yowedo",
6852 "rule" => array(
6853 "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6854 ),
6855 "uri" => "http://yowedo.com/en/partners.html"
6856 ),
6857 "yuntis" => array(
6858 "icon" => "robot",
6859 "title" => "Yuntis",
6860 "rule" => array(
6861 "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6862 ),
6863 "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6864 ),
6865 "zao" => array(
6866 "icon" => "robot",
6867 "title" => "Zao",
6868 "rule" => array(
6869 "Zao[ /]([0-9.]{1,10})" => "\\1",
6870 "Zao-crawler" => ""
6871 ),
6872 "uri" => ""
6873 ),
6874 "zealbot" => array(
6875 "icon" => "zeal",
6876 "title" => "ZealBot",
6877 "rule" => array(
6878 "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6879 ),
6880 "uri" => ""
6881 ),
6882 "zearchit" => array(
6883 "icon" => "zearchit",
6884 "title" => "Zearchit",
6885 "rule" => array(
6886 "Zearchit" => ""
6887 ),
6888 "uri" => "http://www.zearchit.de/"
6889 ),
6890 "zebz" => array(
6891 "icon" => "robot",
6892 "title" => "ze.bz",
6893 "rule" => array(
6894 "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6895 ),
6896 "uri" => "http://www.ze.bz/"
6897 ),
6898 "zedzo" => array(
6899 "icon" => "robot",
6900 "title" => "Zedzo",
6901 "rule" => array(
6902 "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6903 ),
6904 "uri" => "http://www.zedzo.com/"
6905 ),
6906 "zerx" => array(
6907 "icon" => "zerx",
6908 "title" => "Zerx",
6909 "rule" => array(
6910 "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6911 ),
6912 "uri" => "http://www.zerx.com/"
6913 ),
6914 "zeus" => array(
6915 "icon" => "zeus",
6916 "title" => "Zeus",
6917 "rule" => array(
6918 "Zeus" => ""
6919 ),
6920 "uri" => "http://www.zeus.com"
6921 ),
6922 "zippp" => array(
6923 "icon" => "robot",
6924 "title" => "Zippp",
6925 "rule" => array(
6926 "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6927 ),
6928 "uri" => ""
6929 ),
6930 "zippy" => array(
6931 "icon" => "robot",
6932 "title" => "Zippy",
6933 "rule" => array(
6934 "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6935 ),
6936 "uri" => "http://www.zippyfinder.com"
6937 ),
6938 "zoeky" => array(
6939 "icon" => "robot",
6940 "title" => "Zoeky",
6941 "rule" => array(
6942 "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6943 ),
6944 "uri" => ""
6945 ),
6946 "zoom" => array(
6947 "icon" => "zoom",
6948 "title" => "ZoomSpider",
6949 "rule" => array(
6950 "^ZoomSpider" => ""
6951 ),
6952 "uri" => "http://www.wrensoft.com/"
6953 ),
6954 "zspider" => array(
6955 "icon" => "robot",
6956 "title" => "Zspider",
6957 "rule" => array(
6958 "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6959 ),
6960 "uri" => "http://feedback.redkolibri.com/"
6961 ),
6962 "zumbot" => array(
6963 "icon" => "robot",
6964 "title" => "ZUM Search",
6965 "rule" => array(
6966 "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6967 ),
6968 "uri" => "http://help.zum.com/inquiry"
6969 ),
6970 "zyborg" => array(
6971 "icon" => "zyborg",
6972 "title" => "WiseNutBot",
6973 "rule" => array(
6974 "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6975 ),
6976 "uri" => ""
6977 ),
6978 // Catch-up entries for the originals; they have to stay in this order.
6979 "blogbot" => array(
6980 "icon" => "blogbot",
6981 "title" => "BlogBot",
6982 "rule" => array(
6983 "Blog[ \-]?Bot" => ""
6984 ),
6985 "uri" => "http://www.blogbot.com/"
6986 ),
6987 "centrum" => array(
6988 "icon" => "centrum",
6989 "title" => "Centrum",
6990 "rule" => array(
6991 "holmes[/ ]([0-9.]{1,10})" => "\\1",
6992 "^Centrum-checker" => ""
6993 ),
6994 "uri" => ""
6995 ),
6996 "httpclient" => array(
6997 "icon" => "robot",
6998 "title" => "HTTPClient",
6999 "rule" => array(
7000 "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
7001 "HTTP[ \-]?Client" => ""
7002 ),
7003 "uri" => "http://www.innovation.ch/java/HTTPClient/"
7004 ),
7005 "incywincy" => array(
7006 "icon" => "robot",
7007 "title" => "IncyWincy",
7008 "rule" => array(
7009 "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
7010 "^IncyWincy" => ""
7011 ),
7012 "uri" => ""
7013 ),
7014 "java" => array(
7015 "icon" => "java",
7016 "title" => "Java",
7017 "rule" => array(
7018 "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
7019 ),
7020 "uri" => ""
7021 ),
7022 "libfetch" => array(
7023 "icon" => "robot",
7024 "title" => "Libfetch",
7025 "rule" => array(
7026 "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
7027 ),
7028 "uri" => "http://www.freebsd.org/"
7029 ),
7030 "libwww" => array(
7031 "icon" => "libwww",
7032 "title" => "LibWWW",
7033 "rule" => array(
7034 "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
7035 "^libww(w|w-perl|w-FM)" => "",
7036 "MyApp.*libww(w|w-perl|w-FM)" => ""
7037 ),
7038 "uri" => ""
7039 ),
7040 "litefinder" => array(
7041 "icon" => "litefinder",
7042 "title" => "LiteFinder",
7043 "rule" => array(
7044 "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
7045 ),
7046 "uri" => "http://www.litefinder.net/about.html"
7047 ),
7048 "nutchorg" => array(
7049 "icon" => "nutchorg",
7050 "title" => "Nutch",
7051 "rule" => array(
7052 "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
7053 "Nutch" => ""
7054 ),
7055 "uri" => "http://lucene.apache.org/nutch/"
7056 ),
7057 "pythonurl" => array(
7058 "icon" => "pythonurl",
7059 "title" => "Python",
7060 "rule" => array(
7061 "python-requests[ /]([0-9.]{1,10})" => "\\1",
7062 "python-httpx[ /]([0-9.]{1,10})" => "\\1",
7063 "Python[ \-]?urllib" => ""
7064 ),
7065 "uri" => ""
7066 ),
7067 // Robots known to be spam bots
7068 "SPAM" => array( // single entry collecting user agents that are reported under the title "SPAM"
7069 "icon" => "robot",
7070 "title" => "SPAM",
7071 "rule" => array( // keys are regular expressions, so literal "(", ")" and "." have to be backslash-escaped
7072 "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
7073 "^PHOTO CHECK" => "",
7074 "^FOTOCHECKER" => "",
7075 "^IPTC CHECK" => "",
7076 "^DataCha0s" => "",
7077 "Datenprovider" => "",
7078 "nbertaupete95" => "",
7079 "BLEXBot" => "",
7080 "Softpile" => "",
7081 "Expanse" => "",
7082 "Hello World" => "",
7083 "Linux Gnu \(cow\)" => "", // parentheses escaped: unescaped they form a group and the literal "(cow)" never matches
7084 "l9tcpid" => "",
7085 "Mozilliqa" => "",
7086 "cyberscan\.io" => "", // literal dot
7087 "OPENVASVT" => "",
7088 "researchscan" => "",
7089 "CensysInspect[/ ]([0-9.]{1,10})" => "",
7090 "InternetMeasurement[/ ]([0-9.]{1,10})" => "",
7091 "seocompany[/ ]([0-9.]{1,10})" => "",
7092 "tchelebi[/ ]([0-9.]{1,10})" => "",
7093 "masscan[/ ]([0-9.]{1,10})" => "",
7094 "zgrab[/ ]([0-9.]{1,10})" => "",
7095 "^Mac Finder" => "",
7096 "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
7097 "^Missouri College Browse" => "",
7098 "Email[ \-]?Siphon" => "",
7099 "atSpider" => "",
7100 "autoemailspider" => "",
7101 "^Demo Bot" => "",
7102 "^Program Shareware" => "",
7103 "^Snapbot" => "",
7104 "^snap\.com" => "", // literal dot
7105 "^Guestbook Auto Submitter" => "",
7106 "panscient\.com" => "", // literal dot
7107 ),
7108 "uri" => ""
7109 ),
7110 // Things we don't know yet
7111 "robot" => array(
7112 "icon" => "robot",
7113 "title" => "Robot",
7114 "rule" => array(
7115 "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7116 )
7117 )
7118 );
7119 ?>

Properties

Name Value
svn:keywords Id