]> git.ipfire.org Git - thirdparty/AWStats.git/commitdiff
Alternative robots.pm and search_engines.pm
authorvisualperception <github@litody.net>
Fri, 2 Sep 2016 03:58:49 +0000 (04:58 +0100)
committerGitHub <noreply@github.com>
Fri, 2 Sep 2016 03:58:49 +0000 (04:58 +0100)
both files have many additions and corrections. Especially search_engines.pm which has had all google countries added to it and split into:
google country name
google country name images
google country name catchall (for any subdomains we don't know about yet)

wwwroot/cgi-bin/lib/robots.pm
wwwroot/cgi-bin/lib/search_engines.pm

index f6124146f2eb27af5e404cbe7132a65e8ba9987b..a77760a9bcf44eeb65aede90981f235ce74d5378 100644 (file)
-# AWSTATS ROBOTS DATABASE
-#-------------------------------------------------------
-# If you want to add robots to extend AWStats database detection capabilities,
-# you must add an entry in RobotsSearchIDOrder_listx and RobotsHashIDLib.
-
-# The entry in RobotsSearchIDOrder_listx is a Perl regular expression
-# (see http://perldoc.perl.org/perlreref.html). AWStats applies these
-# expressions to the user agent string in the order given by the lists. The
-# first match specifies the robot.
-#
-# Note: This regular expression must not contain any whitespace.
-# Otherwise AWStats will produce lines in the database that
-# will be misinterpreted and as a consequence the corresponding data in the
-# generated HTML reports will be wrong. If you want to match whitespace in
-# the user agent string, use other constructs like '\s', '[[:blank:]]',
-# '\p{IsSpace}', '\x20' etc.
-#
-# The corresponding entry in RobotsHashIDLib contains the regular expression
-# as key, followed by a string containing HTML-text. AWStats inserts this
-# text into reports to describe the bot. If possible the text should contain
-# a link to the bot home page. This makes it easier for sysadmins to find
-# the information necessary e.g. to adapt the robots.txt file.
-#
-# An entry in the RobotsAffiliateLib is not necessary. An entry in this list
-# contains as first part the regular expression specifying the bot. The
-# second part is a string that gives the Company or product managing the bot.
-# This information is not used yet.
-#
-# There are several sorts of bots that AWStats is not able to detect and
-# therefore a considerable amount of bot generated traffic counts
-# as user traffic:
-#
-# a) A crawler that identifies itself in the referrer string, but not in
-#    the user agent string. An example is the crawler from semalt.semalt.com.
-#
-# b) Crawlers that correctly access robots.txt but identify themselves
-#    in the user agent string only once or just a few times. Most of the
-#    time a user agent string is used that does not contain hints that
-#    a bot is involved. An example is the iCjobs spider.
-#    msnbot-UDiscovery/2.0b seems to show this behaviour too.
-#
-#
-#
-#-------------------------------------------------------
-
-# 2005-08-19 Sean Carlos http://www.antezeta.com/awstats.html
-#              added dipsie (not tested with real data).
-#              added DomainsDB.net http://domainsdb.net/
-#              added ia_archiver-web.archive.org (was inadvertently grouped with Alexa traffic)
-#              added Nutch (used by looksmart (furl?))
-#              added rssImagesBot
-#              added Sqworm
-#              added t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e
-#              added w3c css-validator
-#              added documentation link to bot home pages for above and selected major bots.
-#                    In the case of international bots, choose .com page.
-#                    Included tool tip (html "title").
-#                    To do: parameterize to match both AWStats language and tooltips settings.
-#                    To do: add html links for all bots based on current documentation in source
-#                           files referenced below.
-#              changed '\wbot[\/\-]', to '\wbot[\/\-]' (removed comma)
-#              made minor grammar corrections to notes below
-# 2005-08-24   added YahooSeeker-Testing
-#                      added w3c-checklink
-#                      updated url for ask.com
-# 2005-08-24           added Girafabot http://www.girafa.com/
-# 2005-08-30           added PluckFeedCrawler http://www.pluck.com/
-#              added Gaisbot/3.0 (robot05@gais.cs.ccu.edu.tw; )
-#              added geniebot (wgao@genieknows.com)
-#              added BecomeBot link http://www.become.com/site_owners.html
-#              added topicblogs http://www.topicblogs.com/
-#              added Powermarks; seen used by referrer spam
-#              added YahooSeeker
-#              added NG/2. http://www.exabot.com/
-# 2005-09-15   added link for Walhello appie
-#              added bender focused_crawler
-#              updated YahooSeeker description (blog crawler)
-# 2005-09-16   added link for http://linkchecker.sourceforge.net
-#              added ConveraCrawler/0.9d ( http://www.authoritativeweb.com/crawl)
-#              added Blogslive  info@blogslive.com intelliseek.com
-#              added BlogPulse (ISSpider-3.0) intelliseek.com
-# 2005-09-26   added Feedfetcher-Google (http://www.google.com/feedfetcher.html)
-#              added EverbeeCrawler
-#              added Yahoo-Blogs http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html
-#              added link for Bloglines http://www.bloglines.com
-# 2005-10-19   fixed Feedfetcher-Google (http://www.google.com/feedfetcher.html)
-#              added Blogshares Spiders (Synchronized V1.5.1)
-#              added yacy
-# 2005-11-21   added Argus www.simpy.com
-#              added BlogsSay :: RSS Search Crawler (http://www.blogssay.com/)
-#              added MJ12bot http://majestic12.co.uk/bot.php
-#              added OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm)
-#              added OutfoxBot/0.3 (For internet experiments; outfox.agent@gmail.com)
-#              added RufusBot Rufus Web Miner http://64.124.122.252.webaroo.com/feedback.html
-#              added Seekbot (http://www.seekbot.net/bot.html)
-#              added Yahoo-MMCrawler/3.x (mms-mmcrawler-support@yahoo-inc.com)
-#               added link for BaiDuSpider
-#              added link for Blogshares Spider
-#              added link for StackRambler http://www.rambler.ru/doc/faq.shtml
-#              added link for WISENutbot
-#              added link for ZyBorg/1.0 (wn-14.zyborg@looksmart.net; http://www.WISEnutbot.com.  Moved location to above wisenut to avoid classification as wisenut
-# 2005-12-15
-#              added FAST Enteprise Crawler/6 (www dot fastsearch dot com). Note spelling Enteprise not Enterprise.
-#              added findlinks http://wortschatz.uni-leipzig.de/findlinks/
-#              added IBM Almaden Research Center WebFountain™ http://www.almaden.ibm.com/cs/crawler [hc3]
-#              added INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents)
-#              added lmspider (lmspider@scansoft.com) http://www.nuance.com/
-#              added noxtrumbot http://www.noxtrum.com/
-#              added SandCrawler (Microsoft)
-#              added SBIder http://www.sitesell.com/sbider.html
-#              added SeznamBot http://fulltext.seznam.cz/
-#              added sohu-search http://corp.sohu.com/ (looked for //robots.txt not /robots.txt)
-#              added the ruffle SemanticWeb crawler v0.5 - http://www.unreach.net
-#              added WebVulnCrawl/1.0 libwww-perl/5.803 (looked for //robots.txt not /robots.txt)
-#              added Yahoo! Japan keyoshid http://www.yahoo.co.jp/
-#              added Y!J http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html
-#              added link for GigaBot
-#              added link for MagpieRSS
-#              added link for MSIECrawler
-# 2005-12-21
-#              added aipbot http://www.aipbot.com aipbot@aipbot.com [matthys70 users.sourceforge.net]
-#              added Everest-Vulcan Inc./0.1 (R&D project; http://everest.vulcan.com/crawlerhelp)
-#              added Fast-Search-Engine http://www.fast-search-engine.com/ [matthys70  users.sourceforge.net]
-#              added g2Crawler (nobody@airmail.net) http://crawler.instantnetworks.net/
-#              added Jakarta commons-httpclient http://jakarta.apache.org/commons/httpclient/ (hit robots.txt).  May be used as robot or browser - a site may want to remove this entry.
-#              added OmniExplorer_Bot http://www.omni-explorer.com/ [matthys70 users.sourceforge.net]
-#              added USTC-Semantic-Group ai.ustc.edu.cn/mas/en/research/index.php ?
-# 2005-12-22
-#              added EARTHCOM.info www.earthcom.info
-#              added HTTrack off-line browser 'httrack','HTTrack', http://www.httrack.com/ [Moizes Gabor]
-#              added KummHttp http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_g_l_301105_2\b [Moizes Gabor]
-# 2006-01-01
-#              added Dulance http://www.dulance.com/bot.jsp
-#              added MojeekBot http://www.mojeek.com/bot.html
-#              added nicebot http://www.egghelp.org/setup.htm ?
-#              added Snappy http://www.urltrends.com/faq.php
-#              added sohu agent
-#              added VORTEX http://marty.anstey.ca/robots/vortex/ [matthys70 users.sourceforge.net]
-#              added zspider http://feedback.redkolibri.com/
-# 2006-01-13
-#              added boitho.com-dc http://www.boitho.com/dcbot.html
-#              added IRLbot http://irl.cs.tamu.edu/crawler
-#              added virus_detector virus_harvester@securecomputing.com
-#              added Wavefire http://www.wavefire.com; info@wavefire.com
-#              added WebFilter Robot
-# 2006-01-24
-#              added Shim-Crawler http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp
-#              added Exabot exabot.com
-#              added LetsCrawl.com http://letscrawl.com
-#              added ichiro http://help.goo.ne.jp/door/crawlerE.html
-# 2006-01-27    additional 22 robots from a list provided by Moizes Gabor
-#              added ALeadSoftbot      http://www.aleadsoft.com/bot.htm
-#              added CipinetBot        http://www.cipinet.com/bot.html
-#              added Cuasarbot http://www.cuasar.com/
-#              added Dumbot    http://www.dumbfind.com/
-#              added Extreme_Picture_Finder    http://www.exisoftware.com/
-#              added Fooky.com/ScorpionBot/ScoutOut    http://www.fooky.com/scorpionbots
-#              added IlTrovatore-Setaccio      http://www.iltrovatore.it/aiuto/motore_di_ricerca.html  bot@iltrovatore.it
-#              added InsurancoBot      http://www.fastspywareremoval.com/
-#              added InternetArchive   http://lucene.apache.org/nutch/bot.html         nutch-agent@lucene.apache.org
-#              added KazoomBot http://www.kazoom.ca/bot.html   kazoombot@kazoom.ca
-#              added Kurzor    http://www.easymail.hu/ cursor@easymail.hu
-#              added NutchCVS  http://lucene.apache.org/nutch/bot.html nutch-agent@lucene.apache.org
-#              added NutchOSU-VLIB     http://lucene.apache.org/nutch/bot.html nutch-agent@lucene.apache.org
-#              added Orbiter   http://www.dailyorbit.com/bot.htm
-#              added PHP_version_tracker       http://www.nexen.net/phpversion/bot.php
-#              added SuperBot  http://www.sparkleware.com/superbot/
-#              added SynooBot  http://www.synoo.de/bot.html    webmaster@synoo.com
-#              added TestBot   http://www.agbrain.com/
-#              added TutorGigBot       http://www.tutorgig.info/
-#              added WebIndexer        mailto://webindexerv1@yahoo.com
-#              added WebMiner  http://64.124.122.252/feedback.html
-# 2006-02-01
-#              added heritrix https://sourceforge.net/forum/message.php?msg_id=3550202
-#              added Zeus Webster Pro https://sourceforge.net/forum/message.php?msg_id=3141164
-#               additional robots from a list provided by Moizes Gabor [ mojzi -a-t- free mail hu ]
-#              added Candlelight_Favorites_Inspector
-#              added DomainChecker
-#              added EasyDL
-#              added FavOrg
-#              added Favorites_Sweeper
-#              added Html_Link_Validator
-#              added Internet_Ninja
-#              added JRTwine_Software_Check_Favorites_Utility
-#              fixed Microsoft_URL_Control
-#              added miniRank
-#              added Missigua_Locator
-#              added NPBot
-#              added Ocelli
-#              added Onet.pl_SA
-#              added proodleBot
-#              added SearchGuild_DMOZ_Experiment
-#              added Susie
-#              added Website_Monitoring_Bot
-#              added Xenu_Link_Sleuth
-# 2006-05-15
-#              added ASPseek http://www.aspseek.org/
-#              added AdamM Bot http://home.blic.net/adamm/
-#              added archive.org_bot http://crawls.archive.org/collections/bncf/crawl.html
-#              added arianna.libero.it (Italian Portal/search engine)
-#              added Biz360 spider http://www.biz360.com
-#              added BlogBridge Service http://www.blogbridge.com/
-#              added BlogSearch http://www.icerocket.com/
-#              added libcrawl
-#              added edgeio-relanshanbottriever http://www.edgeio.com
-#              added FeedFlow http://feedflow.com/about
-#              added Biblioteca Nazionale Centrale di Firenze (Italian National Archive) http://www.bncf.firenze.sbn.it/raccolta.txt
-#              added Java catchall - used by many spam bots
-#              added lanshanbot http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=%5Cbid_g_l_140406_1%5Cb
-#              added msnbot-media http://search.msn.com/msnbot.htm
-#              added MT::Telegraph::Agent
-#              added Netluchs http://www.netluchs.de/ (German SE bot)
-#              added oBot http://www.webmasterworld.com/forum11/1616.htm
-#              added Onfolio http://www.onfolio.com/  (IE Toolbar plugin) - hit rss feeds.
-#              added ping.blo.gs http://blo.gs/ping.php blog bot
-#              added Sphere Scout http://www.sphere.com/
-#              added sproose crawler http://www.sproose.com/bot.html
-#              added SyndicAPI http://syndicapi.com/bot.html
-#              added Yahoo! Mindset http://mindset.research.yahoo.com/
-#              added msrabot
-#              added Vagabondo & Vagabondo-WAP http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk
-#              fixed Missigua Locator detection (Missigua_Locator -> Missigua Locator)
-#              changed echo to echo! to avoid conflict with the bonecho (Firefox 2.0) browser.
-#                      This requires you to reprocess historic logs if you want EchO! to be recognized for older reports.
-# 2006-05-17
-#              added Alpha Search Agent # 62.152.125.60 Eurologon Srl
-#              added Krugle http://www.krugle.com/crawler/info.html the search engine for developers
-#              added Octora Beta Bot http://www.octora.com/ # Blog and Rss Search Engine
-#              added UbiCrawler http://law.dsi.unimi.it/ubicrawler/
-#              added Yahoo! Slurp China http://misc.yahoo.com.cn/help.html
-#                      You must reprocess old logs for the Yahoo! Slurp China bot to be detected in old reports
-# 2006-05-20
-#              added 1-More Scanner http://www.myzips.com/software/1-More-Scanner.phtml
-#              added Accoona-AI-Agent http://www.accoona.com/
-#              added ActiveBookmark http://www.libmaster.com/active_bookmark.php
-#              added BIGLOTRON http://www.biglotron.com/robot.html
-#              added Bookmark-Manager http://bkm.sourceforge.net/
-#              added cbn00glebot
-#              added Cerberian Drtrs http://www.pgts.com.au/cgi-bin/psql?robot_info=25240
-#              added CFNetwork http://www.cocoadev.com/index.pl?CFNetwork
-#              added CheckWeb link validator http://p.duby.free.fr/chkweb.htm
-#              added Computer and Automation Research Institute Crawler http://www.ilab.sztaki.hu/~stamas/publications/p184-benczur.html
-#              added ConveraCrawler http://www.authoritativeweb.com/crawl/
-#              added ConveraMultiMediaCrawler http://www.authoritativeweb.com/crawl/
-#              added CSE HTML Validator Lite Online http://online.htmlvalidator.com/php/onlinevallite.php
-#              added Cursor http://adcenter.hu/docs/en/bot.html
-#              added Custo http://www.netwu.com/custo/
-#              added DataFountains/DMOZ Downloader http://infomine.ucr.edu/
-#              added Deepindex http://www.deepindex.net/faq.php
-#              added DNSGroup http://www.dnsgroup.com/
-#              added DoCoMo http://www.nttdocomo.co.jp/
-#              added dumm.de-Bot http://www.dumm.de/
-#              added ETS v http://www.freetranslation.com/help/
-#              added eventax http://www.eventax.de/
-#              added FAST Enterprise Crawler * crawleradmin.t-info@telekom.de http://www.telekom.de/
-#              added FAST Enterprise Crawler http://www.fast.no/
-#              added FAST Enterprise Crawler * T-Info_BI_cluster crawleradmin.t-info@telekom.de http://www.telekom.de/
-#              added FeedValidator http://feedvalidator.org/
-#              added FilmkameraBot http://www.filmkamera.at/bot.html
-#              added Findexa Crawler http://www.findexa.no/gulesider/article26548.ece
-#              added Global Fetch http://www.wesonet.com/
-#              added GOFORITBOT http://www.goforit.com/about/
-#              added GoForIt.com http://www.goforit.com/about/
-#              added GPU p2p crawler http://gpu.sourceforge.net/search_engine.php
-#              added HooWWWer http://cosco.hiit.fi/search/hoowwwer/
-#              added HPPrint
-#              added HTMLParser http://htmlparser.sourceforge.net/
-#              added Hundesuche.com-Bot http://www.hundesuche.com/
-#              added InfoBot http://www.infobot.org/
-#              added InfociousBot http://corp.infocious.com/tech_crawler.php
-#              added InternetSupervision http://internetsupervision.com/
-#              added isearch2006 http://www.yahoo.com.cn/
-#              added IUPUI_Research_Bot http://spamhuntress.com/2005/04/25/a-mail-harvester-visits/
-#              added KalamBot http://64.124.122.251/feedback.html
-#              added kamano.de NewsFeedVerzeichnis http://www.kamano.de/
-#              added Kevin http://dznet.com/kevin/
-#              added KnowItAll http://www.cs.washington.edu/research/knowitall/
-#              added Knowledge.com http://www.knowledge.com/
-#              added Kouaa Krawler http://www.kouaa.com/
-#              added ksibot http://ego.ms.mff.cuni.cz/
-#              added Link Valet Online http://www.htmlhelp.com/tools/valet/
-#              added lwp-request http://search.cpan.org/~gaas/libwww-perl-5.69/bin/lwp-request
-#              added lwp-trivial http://search.cpan.org/src/GAAS/libwww-perl-5.805/lib/LWP/Simple.pm
-#              added MapoftheInternet.com http://MapoftheInternet.com/
-#              added Matrix S.p.A. - FAST Enterprise Crawler http://tin.virgilio.it/
-#              added Megite http://www.megite.com/
-#              added Metaspinner http://index.meta-spinner.de/
-#              added Mini-reptile
-#              added Misterbot http://www.misterbot.fr/
-#              added Miva http://www.miva.com/
-#              added Mizzu Labs http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_m_141105_2\b
-#              added MSRBOT http://research.microsoft.com/research/sv/msrbot/
-#              added MS SharePoint Portal Server - MS Search 4.0 Robot http://support.microsoft.com/default.aspx?scid=kb;en-us;284022
-#              added Mydoyouhike http://www.doyouhike.net/my
-#              added NASA Search http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_n_s_140506_2\b
-#              added NetSprint http://www.netsprint.pl/serwis/
-#              added NimbleCrawler http://www.healthline.com/
-#              added OpenWebSpider http://www.openwebspider.org/
-#              added Oracle Ultra Search http://www.oracle.com/technology/products/ultrasearch/index.html
-#              added OSSProxy http://www.marketscore.com/FAQ.Aspx
-#              added passwordmaker.org http://passwordmaker.org/
-#              added PEAR HTTP Request class http://pear.php.net/
-#              added PEERbot http://www.peerbot.com/
-#              added PHP version tracker http://www.nexen.net/phpversion/bot.php
-#              added PictureOfInternet http://malfunction.org/poi/
-#              added plinki http://www.plinki.com/
-#              added Port Huron Labs http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_n_s_1133\b
-#              added PostFavorites http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_n_s_1135\b
-#              added ProjectWF-java-test-crawler
-#              added PyQuery http://sourceforge.net/projects/pyquery/
-#              added Schizozilla http://spamhuntress.com/2005/03/18/gizmo/
-#              added Scumbot
-#              added Sensis Web Crawler http://www.sensis.com.au/
-#              added snap.com beta crawler http://www.snap.com/
-#              added Steeler http://www.tkl.iis.u-tokyo.ac.jp/~crawler/
-#              added STEROID  Download http://faqs.org.ru/progr/pascal/delphi_internet2.htm
-#              added Suchfin-Bot http://www.suchfin.de/
-#              added Sunrise http://www.sunrisexp.com/
-#              added Tagyu Agent http://www.tagyu.com/
-#              added Tcl http client package http://www.tcl.tk/man/tcl8.4/TclCmd/http.htm
-#              added TeragramCrawlerSURF http://www.teragram.com/
-#              added Test Crawler http://netp.ath.cx/
-#              added UnChaos Bot Hybrid Web Search Engine http://www.unchaos.com/
-#              added unido-bot http://www.unchina.org/unido/unido/our_projects/3_3.html
-#              added UniversalFeedParser http://feedparser.org/ (seen from md301000.inktomisearch.com)
-#              added updated http://www.updated.com/
-#              added Vermut http://vermut.aol.com
-#              added versus crawler from eda.baykan@epfl.ch http://www.epfl.ch/Eindex.html
-#              added Vespa Crawler (Yahoo Norway?) http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=%5Cbid_t_z_030406_1%5Cb
-#              added VSE http://www.vivisimo.com/
-#              added webcrawl.net http://www.webcrawl.net/
-#              added Web Downloader http://www.krasu.ru/soft/chuchelo/
-#              added Webdup http://www.webdup.com/en/index.html
-#              added Wells Search http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_t_z_1484\b
-#              added WordPress http://wordpress.org/
-#              added wume crawler http://wume.cse.lehigh.edu/~xiq204/crawler/
-#              added Xenu's Link Sleuth (with ')
-#              added xirq http://www.xirq.com/
-#              added yoogliFetchAgent http://www.yoogli.com/
-#              added Z-Add Link Checker http://w3.z-add.co.uk/linkcheck/
-#              -- fix - some robots were reported with _ where _ should have been a space.
-#              changed Xenu Link Sleuth
-#              changed microsoft[_+\s]url[_+\s]control -> microsoft_url_control
-#              changed favorites_sweeper -> favorites_sweeper
-#              -- updates
-#              updated AskJeeves to Ask
-# 2012-06-05 Albrecht Mueller
-#              added Grabber from SDSC (San Diego Supercomputer Center).
-# 2013-09-30 Albrecht Mueller
-# AWStats probably cannot detect this bot as it identifies itself in
-# the referrer field and not in the user agent string.
-#92.113.100.35 - - [29/Sep/2013:17:22:46 +0200] "GET /robots.txt HTTP/1.1" 200 516 "-" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"
-#92.113.100.35 - - [29/Sep/2013:17:22:49 +0200] "GET /tghome.htm HTTP/1.1" 200 4445 "http://extrabot.com/help/frytygativyheku.htm" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"
-#92.113.100.35 - - [29/Sep/2013:17:22:51 +0200] "GET / HTTP/1.1" 200 5467 "http://extrabot.com/help/frytygativyheku.htm" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"
-
-# to do  MS Search 4.0 Robot
-
-#package AWSROB;
-
-
-# Robots list was found at http://www.robotstxt.org/wc/active/all.txt
-# Other robots can be found at http://www.jafsoft.com/searchengines/webbots.html
-# Rem: To avoid bad detection, some robot's ids were removed from this list:
-#      - Robots with ID of 3 letters only
-#      - Robots called 'webs' and 'tcl'
-# Rem: directhit changed into direct_hit (its real id)
-# Rem: calif changed into calif[^r] to avoid confusion between Tiscalifreenet browser
-# Rem: fish changed into [^a]fish to avoid confusion between Madsafish browser
-# Rem: roadrunner changed into road_runner
-# Rem: lycos changed to lycos_ to avoid confusion with lycos-online browser
-# Rem: voyager changed into ^voyager\/ to avoid to exclude voyager and amigavoyager browser
-
-# RobotsSearchIDOrder
-# It contains all matching criteria to search for in log fields. This list is
-# used to know in which order to search Robot IDs.
-# Most frequent ones are in list1, used when LevelForRobotsDetection is 1 or more
-# Minor robots are in list2, used when LevelForRobotsDetection is 2 or more
-# Note: Robots IDs are in lower case, '_', ' ' and '+' are changed into '[_+\s]' and are quoted.
-#-------------------------------------------------------
-@RobotsSearchIDOrder_list1 = (   # Patterns for the most frequent robots, tried in list order; the first match specifies the robot
-# Common robots (In robot file)
-'appie',
-'architext',
-'bingpreview',
-'bjaaland',
-'contentmatch',
-'ferret',
-'googlebot\-image',            # Listed before googlebot so the more specific pattern is tried first
-'googlebot',
-'google\-sitemaps',
-'google[_+\s]web[_+\s]preview',
-'grabber',
-'gulliver',
-'virus[_+\s]detector',         # Must be before harvest
-'harvest',
-'htdig',
-'jeeves',
-'linkwalker',
-'lilina',
-'lycos[_+\s]',                 # Trailing separator avoids confusion with the lycos-online browser
-'moget',
-'muscatferret',
-'myweb',
-'nomad',
-'scooter',
-'slurp',
-'^voyager\/',                  # Anchored so the voyager and amigavoyager browsers are not excluded
-'weblayers',
-# Common robots (Not in robot file)
-'antibot',
-'bruinbot',
-'digout4u',
-'echo!',                       # 'echo!' rather than 'echo' to avoid conflict with the bonecho (Firefox 2.0) browser
-'fast\-webcrawler',
-'ia_archiver\-web\.archive\.org', # Must be before ia_archiver to avoid confusion with alexa
-'ia_archiver',
-'jennybot',
-'mercator',
-'netcraft',
-'msnbot\-media',               # Listed before msnbot so the more specific pattern is tried first
-'msnbot-udiscovery',           # Listed before msnbot so the more specific pattern is tried first
-'msnbot',
-'petersnews',
-'relevantnoise\.com',
-'unlost_web_crawler',
-'voila',
-'webbase',
-'webcollage',
-'cfetch',
-'zyborg',      # Must be before wisenut
-'wisenutbot'
-);
-@RobotsSearchIDOrder_list2 = (
-# Less common robots (In robot file)
-'007ac9',
-'[^a]fish',
-'abcdatos',
-'abonti\.com',
-'acme\.spider',
-'ahoythehomepagefinder',
-'ahrefsbot',
-'alkaline',
-'anthill',
-'arachnophilia',
-'arale',
-'araneo',
-'aretha',
-'ariadne',
-'powermarks',
-'arks',
-'aspider',
-'atn\.txt',
-'atomz',
-'auresys',
-'backrub',
-'bbot',
-'bigbrother',
-'blackwidow',
-'blindekuh',
-'bloodhound',
-'borg\-bot',
-'brightnet',
-'bspider',
-'cactvschemistryspider',
-'calif[^r]',
-'cassandra',
-'cgireader',
-'checkbot',
-'christcrawler',
-'churl',
-'cienciaficcion',
-'cms\scrawler',
-'collective',
-'combine',
-'conceptbot',
-'coolbot',
-'core',
-'cosmos',
-'crazywebcrawler',
-'cruiser',
-'cusco',
-'cyberspyder',
-'desertrealm',
-'deweb',
-'dienstspider',
-'digger',
-'diibot',
-'direct_hit',
-'dnabot',
-'domainappender',
-'download_express',
-'dragonbot',
-'dwcp',
-'e\-collector',
-'ebiness',
-'elfinbot',
-'emacs',
-'emcspider',
-'esther',
-'evliyacelebi',
-'fastcrawler',
-'feedcrawl',
-'fdse',
-'felix',
-'fetchrover',
-'fido',
-'finnish',
-'fireball',
-'fouineur',
-'francoroute',
-'freecrawl',
-'funnelweb',
-'gama',
-'gazz',
-'gcreep',
-'getbot',
-'geturl',
-'golem',
-'gougou',
-'grapnel',
-'griffon',
-'gromit',
-'gulperbot',
-'hambot',
-'havindex',
-'hometown',
-'htmlgobble',
-'hyperdecontextualizer',
-'iajabot',
-'iaskspider',
-'hl_ftien_spider',
-'sogou',
-'icjobs\.de',
-'iconoclast',
-'ilse',
-'imagelock',
-'incywincy',
-'informant',
-'infoseek',
-'infoseeksidewinder',
-'infospider',
-'inspectorwww',
-'intelliagent',
-'irobot',
-'iron33',
-'israelisearch',
-'javabee',
-'jbot',
-'jcrawler',
-'jobo',
-'jobot',
-'joebot',
-'jubii',
-'jumpstation',
-'kapsi',
-'katipo',
-'kilroy',
-'ko[_+\s]yappo[_+\s]robot',
-'kummhttp',
-'labelgrabber\.txt',
-'larbin',
-'legs',
-'linkidator',
-'linkscan',
-'lockon',
-'logo_gif',
-'macworm',
-'magpie',
-'marvin',
-'mattie',
-'mediafox',
-'merzscope',
-'meshexplorer',
-'mindcrawler',
-'mnogosearch',
-'momspider',
-'monster',
-'motor',
-'muncher',
-'mwdsearch',
-'ndspider',
-'nederland\.zoek',
-'netcarta',
-'netmechanic',
-'netscoop',
-'newscan\-online',
-'nhse',
-'northstar',
-'nzexplorer',
-'objectssearch',
-'occam',
-'octopus',
-'openfind',
-'orb_search',
-'packrat',
-'pageboy',
-'parasite',
-'patric',
-'pegasus',
-'perignator',
-'perlcrawler',
-'phantom',
-'phpdig',
-'piltdownman',
-'pimptrain',
-'pioneer',
-'pitkow',
-'pjspider',
-'plumtreewebaccessor',
-'poppi',
-'portalb',
-'psbot',
-'python',
-'raven',
-'rbse',
-'resumerobot',
-'rhcs',
-'road_runner',
-'robbie',
-'robi',
-'robocrawl',
-'robofox',
-'robozilla',
-'roverbot',
-'rules',
-'safetynetrobot',
-'semalt', #Note: This entry will not work as this crawler identifies itself
-# in the referrer string and not in the user agent string
-'search\-info',
-'search_au',
-'searchprocess',
-'senrigan',
-'sgscout',
-'shaggy',
-'shaihulud',
-'sift',
-'simbot',
-'sistrix', #Virus/trojan-infection? fr-crawler, ca-crawler? See https://www.projecthoneypot.org/ip_37.59.55.128, https://www.projecthoneypot.org/ip_198.27.80.144
-'site\-valet',
-'sitetech',
-'skymob',
-'slcrawler',
-'smartspider',
-'snooper',
-'solbot',
-'speedy',
-'spider[_+\s]monkey',
-'spiderbot',
-'spiderline',
-'spiderman',
-'spiderview',
-'spry',
-'sqworm',
-'ssearcher',
-'suke',
-'sunrise',
-'suntek',
-'sven',
-'tach_bw',
-'tagyu_agent',
-'tailrank',
-'tarantula',
-'tarspider',
-'techbot',
-'templeton',
-'titan',
-'titin',
-'tkwww',
-'tlspider',
-'ucsd',
-'udmsearch',
-'universalfeedparser',
-'urlck',
-'valkyrie',
-'verticrawl',
-'victoria',
-'visionsearch',
-'voidbot',
-'vwbot',
-'w3index',
-'w3m2',
-'wallpaper',
-'wanderer',
-'wapspIRLider',
-'webbandit',
-'webcatcher',
-'webcopy',
-'webfetcher',
-'webfoot',
-'webinator',
-'weblinker',
-'webmirror',
-'webmoose',
-'webquest',
-'webreader',
-'webreaper',
-'websnarf',
-'webspider',
-'webvac',
-'webwalk',
-'webwalker',
-'webwatch',
-'whatuseek',
-'whowhere',
-'wired\-digital',
-'wmir',
-'wolp',
-'wombat',
-'wordpress',
-'worm',
-'woozweb',
-'wwwc',
-'wz101',
-'xenu\slink\ssleuth',
-'xget',
-# Other robots reported by users
-'^finbot', #UA string starts with "finbot", should not match "elfinbot"
-'^webindex$', #UA should not match "webindexer"
-'1\-more_scanner',
-'360spider',
-'a6-indexer',
-'accoona\-ai\-agent',
-'activebookmark',
-'adamm_bot',
-'adsbot-google',
-'advbot',
-'affectv\.co\.uk',
-'almaden',
-'aipbot',
-'aleadsoftbot',
-'alpha_search_agent',
-'allrati',
-'aport',
-'applebot',
-'archive\-de\.com',
-'archive\.org_bot',
-'argus',               # Must be before nutch
-'arianna\.libero\.it',
-'aspseek',
-'asterias',
-'awbot',
-'backlinktest\.com',
-'baiduspider',
-'becomebot',
-'bender',
-'betabot',
-'biglotron',
-'bittorrent_bot',
-'biz360[_+\s]spider',
-'blexbot',
-'blogbridge[_+\s]service',
-'bloglines',
-'blogpulse',
-'blogsearch',
-'blogshares',
-'blogslive',
-'blogssay',
-'bncf\.firenze\.sbn\.it\/raccolta\.txt',
-'bobby',
-'boitho\.com\-dc',
-'bookmark\-manager',
-'boris',
-'bubing',
-'bumblebee',
-'candlelight[_+\s]favorites[_+\s]inspector',
-'careerbot',
-'cbn00glebot',
-'ccbot',
-'cerberian_drtrs',
-'cfnetwork',
-'cipinetbot',
-'checkweb_link_validator',
-'cliqzbot',
-'commons\-httpclient',
-'computer_and_automation_research_institute_crawler',
-'converamultimediacrawler',
-'converacrawler',
-'copubbot',
-'cscrawler',
-'cse_html_validator_lite_online',
-'cuasarbot',
-'cursor',
-'custo',
-'datafountains\/dmoz_downloader',
-'dataprovider\.com',
-'daumoa',
-'daviesbot',
-'daypopbot',
-'deepindex',
-'deusu',
-'dipsie\.bot',
-'dnsgroup',
-'doccheckbot',
-'domainchecker',
-'domainsdb\.net',
-'dotbot',
-'duckduckgo-favicons-bot',
-'dulance',
-'dumbot',
-'dumm\.de\-bot',
-'earthcom\.info',
-'easydl',
-'eccp',
-'edgeio\-retriever',
-'ernst[:blank:]2\.0',
-'ets_v',
-'exactseek',
-'extreme[_+\s]picture[_+\s]finder',
-'eventax',
-'everbeecrawler',
-'everest\-vulcan',
-'ezresult',
-'enteprise',
-'facebook',
-'facebot',
-'fast_enterprise_crawler.*crawleradmin\.t\-info@telekom\.de',
-'fast_enterprise_crawler.*t\-info_bi_cluster_crawleradmin\.t\-info@telekom\.de',
-'finderlein[_+\s]research[_+\s]crawler',
-'matrix_s\.p\.a\._\-_fast_enterprise_crawler', # must come before fast enterprise crawler
-'fast_enterprise_crawler',
-'fast\-search\-engine',
-'fastbot',
-'favicon',
-'favorg',
-'favorites_sweeper',
-'feedburner',
-'feedfetcher\-google',
-'feedflow',
-'feedster',
-'feedsky',
-'feedvalidator',
-'fetchbot',
-'filmkamerabot',
-'filterdb\.iss\.net',
-'findlinks',
-'findexa_crawler',
-'firmilybot',
-'foaf-search\.net',
-'fooky\.com\/ScorpionBot',
-'g2crawler',
-'gaisbot',
-'geniebot',
-'genieo',
-'gigablastopensource',
-'gigabot',
-'girafabot',
-'global_fetch',
-'gnodspider',
-'goforit\.com',
-'goforitbot',
-'gonzo',
-'grapeshot',
-'grub',
-'gpu_p2p_crawler',
-'henrythemiragorobot',
-'heritrix',
-'holmes',
-'hoowwwer',
-'hpprint',
-'htmlparser',
-'html[_+\s]link[_+\s]validator',
-'httrack',
-'hundesuche\.com\-bot',
-'i-bot',
-'icarus6j',
-'ichiro',
-'idmarch',
-'iltrovatore\-setaccio',
-'implisensebot',
-'infobot',
-'infociousbot',
-'infohelfer',
-'infomine',
-'insurancobot',
-'integromedb\.org',
-'internet[_+\s]ninja',
-'internetarchive',
-'internetseer',
-'internetsupervision',
-'ips\-agent',
-'irlbot',
-'isearch2006',
-'istellabot',
-'iupui_research_bot',
-'izsearch',
-'james\sbot',
-'jobboerse', #AWStats seems not to find this one despite the fact that "JobboerseBot" and "jobboerse.com" appear in the UA-string, maybe some previous entry matches
-'jrtwine[_+\s]software[_+\s]check[_+\s]favorites[_+\s]utility',
-'justview',
-'kalambot',
-'kamano\.de_newsfeedverzeichnis',
-'kazoombot',
-'kevin',
-'keyoshid', # Must come before Y!J
-'kinjabot',
-'kinja\-imagebot',
-'knowitall',
-'knowledge\.com',
-'kouaa_krawler',
-'krugle',
-'ksibot',
-'kurzor',
-'lanshanbot',
-'letscrawl\.com',
-'libcrawl',
-'linkbot',
-'linkdex\.com',
-'link_valet_online',
-'metager\-linkchecker',        # Must be before linkchecker
-'linkchecker',
-'linkstats\sbot',
-'lipperhey',
-'livejournal\.com',
-'lmspider',
-'loadtimebot',
-'lssrocketcrawler',
-'ltbot',
-'ltx71',
-'lwp\-request',
-'lwp\-trivial',
-'madaali\.de',
-'magpierss',
-'mail\.ru',
-'mapoftheinternet\.com',
-'meanpathbot',
-'mediabot',
-'mediapartners\-google',
-'megaindex',
-'megite',
-'memorybot',
-'metager2-verification-bot',
-'metajobbot', #Does not show up in the results of Sep. 2015 despite the fact that the corresponing log file has about 40 entries containing "MetaJobBot" in the UA string - strange.
-'metaspinner',
-'miadev',
-'microsoft\sbits',
-'microsoft.*discovery', # = 'microsoft (?:office (?:protocol|existence)|data access internet publishing provider protocol) discovery',
-'microsoft[_+\s]url[_+\s]control',
-'mindupbot',
-'mini\-reptile',
-'minirank',
-'missigua_locator',
-'misterbot',
-'miva',
-'mizzu_labs',
-'mj12bot',
-'mojeekbot',
-'msiecrawler',
-'ms[_+\s]search[_+\s]6\.0[_+\s]robot',
-'ms_search_4\.0_robot',
-'msrabot',
-'msrbot',
-'mt::telegraph::agent',
-'mydoyouhike',
-'nagios',
-'nasa_search',
-'netestate\sne\scrawler',
-'netluchs',
-'netsprint',
-'newsgatoronline',
-'nicebot',
-'nimblecrawler',
-'noxtrumbot',
-'npbot',
-'loocalcrawler/nutch',
-'nutchcvs',
-'nutchosu\-vlib',
-'nutch',  # Must come after other nutch versions
-'ocelli',
-'octora_beta_bot',
-'omniexplorer[_+\s]bot',
-'onet\.pl[_+\s]sa',
-'onfolio',
-'opentaggerbot',
-'openwebspider',
-'optimizer',
-'oracle_ultra_search',
-'orangebot',
-'orbiter',
-'yodaobot',
-'qihoobot',
-'qwantify',
-'passwordmaker\.org',
-'pear_http_request_class',
-'peerbot',
-'perman',
-'php[_+\s]version[_+\s]tracker',
-'phpcrawl',
-'picmole',
-'pictureofinternet',
-'ping\.blo\.gs',
-'plinki',
-'pluckfeedcrawler',
-'plukkie',
-'pogodak',
-'pompos',
-'popdexter',
-'port_huron_labs',
-'postfavorites',
-'projectwf\-java\-test\-crawler',
-'proodlebot',
-'publiclibraryarchive',
-'pyquery',
-'rambler',
-'redalert',
-'riddler',
-'rogerbot',
-'rojo',
-'rssimagesbot',
-'ruffle',
-'rufusbot',
-'safeads\.xyz',
-'safesearch',
-'sandcrawler',
-'savetheworldheritage',
-'sbider',
-'schizozilla',
-'scumbot',
-'searchguild[_+\s]dmoz[_+\s]experiment',
-'searchmetricsbot',
-'seekbot',
-'semrushbot',
-'sensis_web_crawler',
-'seodiver',
-'seokicks\.de',
-'seoscanners',
-'seznambot',
-'shim\-crawler',
-'shoutcast',
-'sitedomain-bot',
-'siteexplorer\.info',
-'skimbot',
-'slysearch',
-'smtbot',
-'snap\.com_beta_crawler',
-'sohu\-search',
-'sohu', # "sohu agent"
-'snappy',
-'spbot',
-'sphere_scout',
-'spiderlytics',
-'spip',
-'sproose_crawler',
-'ssearch_bot',
-'steeler',
-'steroid__download',
-'stq_bot',
-'suchfin\-bot',
-'superbot',
-'surveybot',
-'susie',
-'syndic8',
-'syndicapi',
-'synoobot',
-'tcl_http_client_package',
-'technoratibot',
-'teragramcrawlersurf',
-'test_crawler',
-'testbot',
-'thumbsniper',
-'t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e',
-'topicblogs',
-'turnitinbot',
-'turtlescanner',               # Must be before turtle
-'turtle',
-'tutorgigbot',
-'twiceler',
-'ubicrawler',
-'ultraseek',
-'unchaos_bot_hybrid_web_search_engine',
-'unido\-bot',
-'unisterbot',
-'updated',
-'ustc\-semantic\-group',
-'vagabondo\-wap',
-'vagabondo',
-'vebidoobot',
-'vermut',
-'versus_crawler_from_eda\.baykan@epfl\.ch',
-'vespa_crawler',
-'voltron',
-'vortex',
-'vse\/',
-'w3c\-checklink',
-'w3c[_+\s]css[_+\s]validator[_+\s]jfouffa',
-'w3c_validator',
-'watchmouse',
-'wavefire',
-'waybackarchive\.org',
-'wbsearchbot',
-'webclipping\.com',
-'webcompass',
-'webcrawl\.net',
-'web_downloader',
-'webdup',
-'webfilter',
-'webindexer',
-'webminer',
-'website[_+\s]monitoring[_+\s]bot',
-'webvulncrawl',
-'wells_search',
-'wer-liefert-was',
-'wesee:search',
-'wevikabot',
-'wonderer',
-'wotbox',
-'wume_crawler',
-'wwweasel',
-'xenu\'s_link_sleuth',
-'xenu_link_sleuth',
-'xirq',
-'xovibot',
-'y!j', # Must come after keyoshid Y!J
-'yacy',
-'yahoo\-blogs',
-'yahoo\-verticalcrawler',
-'yahoofeedseeker',
-'yahooseeker\-testing',
-'yahooseeker',
-'yahoo\-mmcrawler',
-'yahoo!_mindset',
-'yandex',
-'flexum',
-'yanga',
-'yet-another-spider',
-'yisouspider',
-'yooglifetchagent',
-'z\-add_link_checker',
-'zealbot',
-'zhuaxia',
-'zspider',
-'zeus',
-'ng\/1\.', # put at end to avoid false positive
-'ng\/2\.', # put at end to avoid false positive
-'exabot',  # put at end to avoid false positive
-# Additional bots found by Sussex.
-'^[1-3]$', # Hiding bots. Doesn't appear to be a valid user agent.
-'alltop',
-'applesyndication',
-'asynchttpclient',
-'bingbot',
-'blogged_crawl',
-'bloglovin',
-'butterfly',
-'buzztracker',
-'carpathia',
-'catbot',
-'chattertrap',
-'check_http', #(nagios) a monitoring tool
-'coldfusion',
-'covario',
-'daylifefeedfetcher',
-'discobot',
-'dlvr\.it',
-'dreamwidth',
-'drupal',
-'ezoom',
-'feedmyinbox',
-'feedroll\.com',
-'feedzira',
-'fever\/',
-'freenews',
-'geohasher',
-'hanrss',
-'inagist',
-'jacobin\sclub',
-'jakarta',
-'js\-kit',
-'largesmall\scrawler',
-'linkedinbot',
-'longurl',
-'metauri',
-'microsoft\-webdav\-miniredir',
-'^motorola$',
-'movabletype',
-# These appear to be bots trying to hide. All of the usual architecture data is missing.
-'^mozilla\/3\.0\s\(compatible$',
-'^mozilla\/4\.0$',
-'^mozilla\/4\.0\s\(compatible;\)$',
-'^mozilla\/5\.0$',
-'^mozilla\/5\.0\s\(compatible;$',
-'^mozilla\/5\.0\s\(en\-us\)$',
-'^mozilla\/5\.0\sfirefox\/3\.0\.5$',
-'^msie',
-# End of hiding bots.
-'netnewswire',
-'\snetseer\s',
-'netvibes',
-'newrelicpinger',
-'newsfox',
-'nextgensearchbot',
-'ning',
-'pingdom',
-'pita',
-'postpost',
-'postrank',
-'printfulbot',
-'protopage',
-'proximic',
-'quipply',
-'r6\_',
-'ratingburner',
-'regator',
-'rome\sclient',
-'rpt\-httpclient',
-'rssgraffiti',
-'sage\+\+',
-'scoutjet',
-'simplepie',
-'sitebot',
-'summify\.com',
-'superfeedr',
-'synthesio',
-'teoma',
-'topblogsinfo',
-'topix\.net',
-'trapit',
-'trileet',
-'tweetedtimes',
-'twisted\spagegetter',
-'twitterbot',
-'twitterfeed',
-'unwindfetchor',
-'wazzup',
-'windows\-rss\-platform',
-'wiumi',
-'xydo',
-'yahoo!\sslurp',
-'yahoo\spipes',
-'yahoo\-newscrawler',
-'yahoocachesystem',
-'yahooexternalcache',
-'yahoo!\ssearchmonkey',
-'yahooysmcm',
-'yammer',
-# 'yandexbot', #already covered by 'yandex'
-'yeti',
-'yie8',
-'youdao',
-'yourls',
-'zemanta',
-'zend_http_client',
-'zumbot',
-# Other id that are 99% of robots
-'wget',
-'libwww',
-'^java\/[0-9]'   # put at end to avoid false positive
-);
-@RobotsSearchIDOrder_listgen = (
-# Generic robot patterns: broad substrings (robot, crawl, spider, ...) rather than names of individual bots.
-'robot',
-'checker',
-'crawl',
-'discovery',
-'hunter',
-'scanner',
-'spider',
-'sucker',
-'bot[\s_+:,\.\;\/\\\-]',
-# NOTE(review): the preceding bot+separator pattern appears to identify the user agent
-#"Mozilla/5.0 (Linux; U; Android 4.2.2; de-de; CUBOT P9 Build/JDQ39) AppleWebKit/534.30 (KHTML, like Gecko) Version/4.0 Mobile Safari/534.30"
-#as a bot. There is an Android mobile phone called "CUBOT P9", so this is probably a false positive and not a bot.
-'[\s_+:,\.\;\/\\\-]bot',
-'curl',
-'php',
-'ruby\/',
-'no_user_agent'
-);
-
-
-
-# RobotsHashIDLib
-# List of robots names ('robot id','robot clear text')
-#-------------------------------------------------------
-%RobotsHashIDLib   = (
-# Common robots (In robot file)
-'appie','<a href="http://www.walhello.com/" title="Bot home page [new window]" target="_blank">Walhello appie</a>',
-'architext','ArchitextSpider',
-'bingpreview','Bing Preview bot',
-'bjaaland','Bjaaland',
-'ferret','Wild Ferret Web Hopper #1, #2, #3',
-'contentmatch','<a href="http://p4p.cn.yahoo.com">Yahoo!China ContentMatch Crawler</a>',
-'googlebot\-image','<a href="http://www.google.com/bot.html" title="Bot home page [new window]" target="_blank">Googlebot-Image</a>',
-'googlebot','<a href="http://www.google.com/bot.html" title="Bot home page [new window]" target="_blank">Googlebot</a>',
-'google\-sitemaps', 'Google Sitemaps',
-'grabber', '<a href="http://www.sdsc.edu/" title="Seltsame Aktivitaeten vom San Diego Supercomputer Center [new window]" target="_blank">Grabber (SDSC)</a>',
-'google[_+\s]web[_+\s]preview', 'Google Web Preview',
-'gulliver','Northern Light Gulliver',
-'virus[_+\s]detector','<a href="http://www.securecomputing.com/" title="virus_harvester@securecomputing.com; Bot home page [new window]" target="_blank">virus_detector</a>',
-'harvest','Harvest',
-'htdig','ht://Dig',
-'jeeves','<a href="http://sp.ask.com/docs/about/tech_crawling.html" title="Bot home page [new window]" target="_blank">Ask</a>',
-'linkwalker','LinkWalker',
-'lilina','Lilina',
-'lycos[_+\s]','Lycos',
-'moget','moget',
-'muscatferret','Muscat Ferret',
-'myweb','Internet Shinchakubin',
-'nomad','Nomad',
-'scooter','Scooter',
-'slurp','<a href="http://help.yahoo.com/help/us/ysearch/slurp/" title="Bot home page [new window]" target="_blank">Yahoo Slurp</a>',
-'^voyager\/','Voyager',
-'weblayers','Weblayers',
-# Common robots (Not in robot file)
-'antibot','Antibot',
-'bruinbot','<a href="http://web.archive.org/" title="BruinBot home page [new window]" target="_blank">The web archive</a>',
-'digout4u','Digout4u',
-'echo!','EchO!',
-'fast\-webcrawler','Fast-Webcrawler',
-'ia_archiver\-web\.archive\.org','<a href="http://web.archive.org/" title="Bot home page [new window]" target="_blank">The web archive (IA Archiver)</a>',
-'ia_archiver','<a href="http://www.alexa.com/" title="Bot home page [new window]" target="_blank">Alexa (IA Archiver)</a>',
-'jennybot','JennyBot',
-'mercator','Mercator',
-'msnbot\-media','<a href="http://search.msn.com/msnbot.htm" title="Bot home page [new window]" target="_blank">MSNBot-media</a>',
-'msnbot-udiscovery', '<a href="http://search.msn.com/msnbot.htm" title="Feb 18, 2015: UA contains indentification during robots.txt access only." target="_blank">msnbot-UDiscovery</a> Note: AWStats counts most of its traffic as user traffic',
-'msnbot','<a href="http://search.msn.com/msnbot.htm" title="Bot home page [new window]" target="_blank">MSNBot</a>',
-'netcraft','<a href="http://www.netcraft.com/survey/" title="Bot home page [new window]" target="_blank">Netcraft</a>',
-'petersnews','Petersnews',
-'unlost_web_crawler','Unlost Web Crawler',
-'voila','Voila',
-'webbase', 'WebBase',
-'zyborg','<a href="http://www.WISEnutbot.com/" title="wn-14.zyborg@looksmart.net Bot home page [new window]" target="_blank">ZyBorg</a>',
-'wisenutbot','<a href="http://www.WISEnutbot.com/" title="Bot home page [new window]" target="_blank">WISENutbot</a>',
-'webcollage','<a href="http://www.jwz.org/webcollage/" title="WebCollage home page [new window]" target="_blank">WebCollage</a>',
-'cfetch','<a href="http://www.kosmix.com/crawler.html" title="kosmix home page [new window]" target="_blank">Cfetch</a>',
-# Less common robots (In robot file)
-'007ac9',  '<a href="http://crawler.007ac9.net/" rel="nofollow" title="007ac9 Crawler Page [new window]" target="_blank">007ac9 Crawler</a>, seems to belong to <a href="http://www.sistrix.com/" rel="nofollow" title="SISTRIX Home Page [new window]" target="_blank">SISTRIX</a>',
-'[^a]fish','Fish search',
-'abcdatos','ABCdatos BotLink',
-'abonti\.com','<a href="http://www.abonti.com/" title="Abonti WebSearch [new window]" target="_blank">Abonti WebSearch</a>',
-'acme\.spider','Acme.Spider',
-'ahoythehomepagefinder','Ahoy! The Homepage Finder',
-'ahrefsbot', '<a href="http://ahrefs.com/robot/" title="Bot home page [new window]" target="_blank">AhrefsBot</a>',
-'alkaline','Alkaline',
-'anthill','Anthill',
-'arachnophilia','Arachnophilia',
-'arale','Arale',
-'araneo','Araneo',
-'aretha','Aretha',
-'ariadne','ARIADNE',
-'powermarks','<a href="http://www.kaylon.com/power.html" title="Bot home page [new window]" target="_blank">Powermarks</a>', # must come before Arks; seen used by referrer spam
-'arks','arks',
-'aspider','ASpider (Associative Spider)',
-'atn\.txt','ATN Worldwide',
-'atomz','Atomz.com Search Robot',
-'auresys','AURESYS',
-'backrub','BackRub',
-'bbot','BBot',
-'bigbrother','Big Brother',
-'blackwidow','BlackWidow',
-'blindekuh','Die Blinde Kuh',
-'bloodhound','Bloodhound',
-'borg\-bot','Borg-Bot',
-'brightnet','bright.net caching robot',
-'bspider','BSpider',
-'cactvschemistryspider','CACTVS Chemistry Spider',
-'calif[^r]','Calif',
-'cassandra','Cassandra',
-'cgireader','Digimarc Marcspider/CGI',
-'checkbot','Checkbot',
-'christcrawler','ChristCrawler.com',
-'churl','churl',
-'cienciaficcion','cIeNcIaFiCcIoN.nEt',
-'cms\scrawler', '<a href="http://www.cmscrawler.com" rel="nofollow" title="CMS Crawler Home Page [new window]" target="_blank">CMS Crawler</a>',
-'collective','Collective',
-'combine','Combine System',
-'conceptbot','Conceptbot',
-'coolbot','CoolBot',
-'core','Web Core / Roots',
-'cosmos','XYLEME Robot',
-'crazywebcrawler', '<a href="http://www.crazywebcrawler.com/" rel="nofollow" title="CrazyWeb Crawler Home Page [new window]" target="_blank">CrazyWeb Crawler</a>',
-'cruiser','Internet Cruiser Robot',
-'cusco','Cusco',
-'cyberspyder','CyberSpyder Link Test',
-'desertrealm','Desert Realm Spider',
-'deweb','DeWeb(c) Katalog/Index',
-'dienstspider','DienstSpider',
-'digger','Digger',
-'diibot','Digital Integrity Robot',
-'direct_hit','Direct Hit Grabber',
-'dnabot','DNAbot',
-'domainappender',  '<a href="http://www.profound.net/domainappender" rel="nofollow" title="DomainAppender Home Page [new window]" target="_blank">DomainAppender</a>',
-'download_express','DownLoad Express',
-'dragonbot','DragonBot',
-'dwcp','DWCP (Dridus\' Web Cataloging Project)',
-'e\-collector','e-collector',
-'ebiness','EbiNess',
-'elfinbot','ELFINBOT',
-'emacs','Emacs-w3 Search Engine',
-'emcspider','ananzi',
-'esther','Esther',
-'evliyacelebi','Evliya Celebi',
-'fastcrawler','FastCrawler',
-'feedcrawl','FeedCrawl by feed@aobo.com',
-'fdse','Fluid Dynamics Search Engine robot',
-'felix','Felix IDE',
-'fetchrover','FetchRover',
-'fido','fido',
-'finnish','Finnish',
-'fireball','KIT-Fireball',
-'fouineur','Fouineur',
-'francoroute','Robot Francoroute',
-'freecrawl','Freecrawl',
-'funnelweb','FunnelWeb',
-'gama','gammaSpider, FocusedCrawler',
-'gazz','gazz',
-'gcreep','GCreep',
-'getbot','GetBot',
-'geturl','GetURL',
-'golem','Golem',
-'gougou','GouGou',
-'grapnel','Grapnel/0.01 Experiment',
-'griffon','Griffon',
-'gromit','Gromit',
-'gulperbot','Gulper Bot',
-'hambot','HamBot',
-'havindex','havIndex',
-'hometown','Hometown Spider Pro',
-'htmlgobble','HTMLgobble',
-'hyperdecontextualizer','Hyper-Decontextualizer',
-'iajabot','iajaBot',
-'iaskspider','<a href="http://www.iask.com/" target="_blank">Sina Iask Spider</a>',
-'hl_ftien_spider','<a href="http://www.hylanda.com/" target="_blank">Hylanda</a>',
-'sogou','<a href="http://www.sogou.com/" target="_blank">Sogou Spider</a>',
-'icjobs\.de', '<a href="http://www.icjobs.de/" title="April 10, 2014: UA contains indentification during the first and second page access only." target="_blank">iCjobs Spider</a> Note: Most traffic counts as user traffic',
-#20130805 The user agent string of the icjobs-spider contained the
-#identifying string only when it accessed the robots.txt file.
-#When it accessed the actual content it did not identify itself as
-#a spider. Thus traffic of this spider was counted as user traffic.
-#The behavior seems to have changed now - the spider identifies itself
-#when it accesses content pages.
-#20141401 Behavior as before: Does identify itself when it accesses
-# robots.txt and the root page. The following traffic does not contain
-# the identification string and is therefore counted as user traffic.
-'iconoclast','Popular Iconoclast',
-'ilse','Ingrid',
-'imagelock','Imagelock',
-'incywincy','IncyWincy',
-'informant','Informant',
-'infoseek','InfoSeek Robot 1.0',
-'infoseeksidewinder','Infoseek Sidewinder',
-'infospider','InfoSpiders',
-'inspectorwww','Inspector Web',
-'intelliagent','IntelliAgent',
-'ips\-agent', 'ips-agent Verisign(?) - no reliable information found.',
-'irobot','I, Robot',
-'iron33','Iron33',
-'israelisearch','Israeli-search',
-'javabee','JavaBee',
-'jbot','JBot Java Web Robot',
-'jcrawler','JCrawler',
-'jobo','JoBo Java Web Robot',
-'jobot','Jobot',
-'joebot','JoeBot',
-'jubii','The Jubii Indexing Robot',
-'jumpstation','JumpStation',
-'kapsi','image.kapsi.net',
-'katipo','Katipo',
-'kilroy','Kilroy',
-'ko[_+\s]yappo[_+\s]robot','KO_Yappo_Robot',
-'kummhttp','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_g_l_301105_2\b" title="Bot documentation page [new window]" target="_blank">KummHttp</a>',
-'labelgrabber\.txt','LabelGrabber',
-'larbin','<a href="http://para.inria.fr/~ailleret/larbin/index-eng.html" title="Bot home page [new window]" target="_blank">larbin</a>',
-'legs','legs',
-'linkidator','Link Validator',
-'linkscan','LinkScan',
-'lockon','Lockon',
-'logo_gif','logo.gif Crawler',
-'macworm','Mac WWWWorm',
-'lmspider','<a href="http://www.nuance.com/" title="Bot home page lmspider@scansoft.com [new window]" target="_blank">lmspider</a>',
-'lwp\-request','<a href="http://search.cpan.org/~gaas/libwww-perl-5.69/bin/lwp-request" title="lwp-request home page [new window]" target="_blank">lwp-request</a>',
-'lwp\-trivial','<a href="http://search.cpan.org/src/GAAS/libwww-perl-5.805/lib/LWP/Simple.pm" title="lwp-trivial home page [new window]" target="_blank">lwp-trivial</a>',
-'magpie','<a href="http://magpierss.sf.net/" title="Bot home page [new window]" target="_blank">MagpieRSS</a>',
-'marvin','marvin/infoseek',
-'mattie','Mattie',
-'mediafox','MediaFox',
-'merzscope','MerzScope',
-'meshexplorer','NEC-MeshExplorer',
-'mindcrawler','MindCrawler',
-'mnogosearch','mnoGoSearch search engine software',
-'momspider','MOMspider',
-'monster','Monster',
-'motor','Motor',
-'muncher','Muncher',
-'mwdsearch','Mwd.Search',
-'ndspider','NDSpider',
-'nederland\.zoek','Nederland.zoek',
-'netcarta','NetCarta WebMap Engine',
-'netmechanic','<a href="http://www.netmechanic.com/" title="Bot home page [new window]" target="_blank">NetMechanic</a>',
-'netscoop','NetScoop',
-'newscan\-online','newscan-online',
-'nhse','NHSE Web Forager',
-'northstar','The NorthStar Robot',
-'nzexplorer','nzexplorer',
-'objectssearch','ObjectsSearch',
-'occam','Occam',
-'octopus','HKU WWW Octopus',
-'openfind','Openfind data gatherer',
-'orb_search','Orb Search',
-'packrat','Pack Rat',
-'pageboy','PageBoy',
-'parasite','ParaSite',
-'patric','Patric',
-'pegasus','pegasus',
-'perignator','The Peregrinator',
-'perlcrawler','PerlCrawler 1.0',
-'phantom','Phantom',
-'phpdig','PhpDig',
-'piltdownman','PiltdownMan',
-'pimptrain','Pimptrain.com\'s robot',
-'pioneer','Pioneer',
-'pitkow','html_analyzer',
-'pjspider','Portal Juice Spider',
-'plumtreewebaccessor','PlumtreeWebAccessor',
-'poppi','Poppi',
-'portalb','PortalB Spider',
-'psbot','<a href="http://www.picsearch.com/bot.html" title="Bot home page" target="_blank">psbot</a>',
-'python','<a href="http://docs.python.org/library/urllib.html" title="Tools developed using a Python library" target="_blank">Python-urllib</a>',
-'raven','Raven Search',
-'rbse','RBSE Spider',
-'resumerobot','Resume Robot',
-'rhcs','RoadHouse Crawling System',
-'road_runner','Road Runner: The ImageScape Robot',
-'robbie','Robbie the Robot',
-'robi','ComputingSite Robi/1.0',
-'robocrawl','RoboCrawl Spider',
-'robofox','RoboFox',
-'robozilla','Robozilla',
-'roverbot','Roverbot',
-'rules','RuLeS',
-'safetynetrobot','SafetyNet Robot',
-'semalt', '<a href="http://semalt.semalt.com/" rel="nofollow" title="seamalt.com Home Page [new window]" target="_blank">seamalt.com</a>',
-'search\-info','Sleek',
-'search_au','Search.Aus-AU.COM',
-'searchprocess','SearchProcess',
-'senrigan','Senrigan',
-'sgscout','SG-Scout',
-'shaggy','ShagSeeker',
-'shaihulud','Shai\'Hulud',
-'sift','Sift',
-'simbot','Simmany Robot Ver1.0',
-'sistrix', '<a href="http://crawler.sistrix.net/" rel="nofollow" title="SISTRIX Crawler Page [new window]" target="_blank">SISTRIX Crawler</a>',
-'site\-valet','Site Valet',
-'sitetech','SiteTech-Rover',
-'skymob','Skymob.com',
-'slcrawler','SLCrawler',
-'smartspider','Smart Spider',
-'snooper','Snooper',
-'solbot','Solbot',
-'speedy','<a href="http://www.entireweb.com/about/search_tech/speedyspider/" title="Speedy Spider home page [new window]" target="_blank">Speedy Spider</a>',
-'spider[_+\s]monkey','Spider monkey',
-'spiderbot','SpiderBot',
-'spiderline','Spiderline Crawler',
-'spiderlytics', 'Spiderlytics: No homepage, e-mail only: spider (at) spiderlytics.com',
-'spiderman','<a href="http://www.iscrawling.com" title="Spiderman home page [new window]" target="_blank">Spiderman</a>',
-'spiderview','SpiderView(tm)',
-'spry','Spry Wizard Robot',
-'ssearcher','Site Searcher',
-'sqworm','<a href="http://www.websense.com/" title="Bot home page (source: http://www.pgts.com.au/) [new window]" target="_blank">Sqworm</a>',
-'suke','Suke',
-'sunrise','<a href="http://www.sunrisexp.com/" title="Sunrise home page [new window]" target="_blank">Sunrise</a>',
-'suntek','suntek search engine',
-'sven','Sven',
-'tach_bw','TACH Black Widow',
-'tagyu_agent','<a href="http://www.tagyu.com/" title="Bot home page [new window]" target="_blank">Tagyu Agent</a>',
-'tarantula','Tarantula',
-'tarspider','tarspider',
-'tailrank','<a href="http://tailrank.com/robot">TailRank</a>',
-'techbot','TechBOT',
-'templeton','Templeton',
-'titan','TITAN',
-'titin','TitIn',
-'tkwww','The TkWWW Robot',
-'tlspider','TLSpider',
-'ucsd','UCSD Crawl',
-'udmsearch','UdmSearch',
-'universalfeedparser','<a href="http://feedparser.org/" title="Bot home page [new window]" target="_blank">UniversalFeedParser</a>',
-'urlck','URL Check',
-'valkyrie','Valkyrie',
-'verticrawl','Verticrawl',
-'victoria','Victoria',
-'visionsearch','vision-search',
-'voidbot','void-bot',
-'vwbot','VWbot',
-'w3index','The NWI Robot',
-'w3m2','W3M2',
-'wallpaper','WallPaper (alias crawlpaper)',
-'wanderer','the World Wide Web Wanderer',
-'wapspider','w@pSpider by wap4.com',
-'webbandit','WebBandit Web Spider',
-'webcatcher','WebCatcher',
-'webcopy','WebCopy',
-'webfetcher','webfetcher',
-'webfoot','The Webfoot Robot',
-'webinator','Webinator',
-'weblinker','WebLinker',
-'webmirror','WebMirror',
-'webmoose','The Web Moose',
-'webquest','WebQuest',
-'webreader','Digimarc MarcSpider',
-'webreaper','WebReaper',
-'websnarf','Websnarf',
-'webspider','WebSpider',
-'webvac','WebVac',
-'webwalk','webwalk',
-'webwalker','WebWalker',
-'webwatch','WebWatch',
-'whatuseek','whatUseek Winona',
-'whowhere','WhoWhere Robot',
-'wired\-digital','Wired Digital',
-'wmir','w3mir',
-'wolp','WebStolperer',
-'wombat','The Web Wombat',
-'wordpress','<a href="http://wordpress.org/" title="WordPress home page [new window]" target="_blank">WordPress</a>',
-'worm','The World Wide Web Worm',
-'woozweb','Woozweb Monitoring',
-'wwwc','WWWC Ver 0.2.5',
-'wz101','WebZinger',
-'xenu\slink\ssleuth', '<a href="http://home.snafu.de/tilman/xenulink.html" rel="nofollow" title="Description, Download, FAQ Page [new window]" target="_blank">Xenu'. "'" . 's Link Sleuth <sup>(TM)</sup></a>, see <a href="http://en.wikipedia.org/wiki/Xenu%27s_Link_Sleuth" rel="nofollow" title="Wikipedia on Xenu'. "'" . 's Link Sleuth [new window]" target="_blank">Wikipedia</a>',
-'xget','XGET',
-# Other robots reported by users
-'^finbot', '<span title="As on Sep. 10, 2015, the user agent string did not contain a web address.">finbot</span>',
-'^webindex$', '<span title="As on Oct. 28, 2015, the user agent string did not contain a web address.">WebIndex</span>',
-'1\-more_scanner','<a href="http://www.myzips.com/software/1-More-Scanner.phtml" title="1-More Scanner home page [new window]" target="_blank">1-More Scanner</a>',
-'360spider','<a href="https://www.google.com/search?q=360spider+-Ferrari" title="No home page, using Google search instead [new window]" target="_blank">360spider</a>',
-'a6-indexer',  '<a href="http://www.a6corp.com/a6-web-scraping-policy/" rel="nofollow" title="A6-Indexer [new window]" target="_blank">A6-Indexer</a>',
-'accoona\-ai\-agent','<a href="http://www.accoona.com/" title="Accoona-AI-Agent home page [new window]" target="_blank">Accoona-AI-Agent</a>',
-'activebookmark','<a href="http://www.libmaster.com/active_bookmark.php" title="ActiveBookmark home page [new window]" target="_blank">ActiveBookmark</a>',
-'adamm_bot','<a href="http://home.blic.net/adamm/" title="Bot home page [new window]" target="_blank">AdamM Bot</a>',
-'adsbot-google', '<a href="http://www.google.com/adsbot.html" rel="nofollow" title="AdsBot-Google home page [new window]" target="_blank">AdsBot-Google</a>',
-'advbot', '<a href="http://advbot.net/bot.html" rel="nofollow" title="AdvBot Home Page [new window]" target="_blank">AdvBot</a>',
-'affectv\.co\.uk', '<a href="http://www.affectv.co.uk" rel="nofollow" title="affectv.co.uk Home Page [new window]" target="_blank">affectv.co.uk</a>',
-'almaden','<a href="http://www.almaden.ibm.com/cs/crawler" title="IBM Almaden Research Center WebFountain&trade; Bot home page [new window]" target="_blank">IBM Almaden</a> Research Center WebFountain&trade;',
-'aipbot','<a href="http://www.aipbot.com/" title="aipbot@aipbot.com Bot home page [new window]" target="_blank">aipbot</a>',
-'aleadsoftbot','<a href="http://www.aleadsoft.com/bot.htm" title="ALeadSoftbot home page [new window]" target="_blank">ALeadSoftbot</a>',
-'alpha_search_agent','Alpha Search Agent',
-'allrati','Allrati',
-'aport', 'Aport',
-'applebot', '<a href="http://www.apple.com/go/applebot" rel="nofollow" title="Applebot Home Page [new window]" target="_blank">Applebot</a>',
-'archive\-de\.com',  '<a href="http://archive-de.com/bot" rel="nofollow" title="Archive-de.com Home Page [new window]" target="_blank">Archive-de.com</a>',
-'archive\.org_bot','<a href="http://crawls.archive.org/collections/bncf/crawl.html" title="Bot home page [new window]" target="_blank">archive.org bot</a>',
-'argus','<a href="http://www.simpy.com/bot.html" title="feedback@simpy.com Bot home page [new window]" target="_blank">Argus</a>',
-'arianna\.libero\.it','<a href="http://arianna.libero.it/" title="Bot home page [new window]" target="_blank">arianna.libero.it</a>',
-'aspseek','<a href="http://www.aspseek.org/" title="Bot home page [new window]" target="_blank">ASPseek</a>',
-'asterias', 'Asterias',
-'awbot', 'AWBot',
-'backlinktest\.com', '<a href="http://www.backlinktest.com/crawler.html" title="BacklinkCrawler [new window]" target="_blank">BacklinkCrawler</a>',
-'baiduspider','<a href="http://www.baidu.com/search/spider.html" title="Bot home page [new window]" target="_blank">BaiDuSpider</a>',
-'becomebot', '<a href="http://www.become.com/site_owners.html" title="Bot home page [new window]" target="_blank">BecomeBot</a>',
-'bender','<a href="http://bender.ucr.edu/" title="Bot home page [new window]" target="_blank">bender</a> <a href="http://ivia.ucr.edu/manuals/NiFC/current/index.shtml" title="Bot home page [new window]" target="_blank">focused_crawler</a>',
-'betabot','BetaBot',
-'biglotron','<a href="http://www.biglotron.com/robot.html" title="Bot home page [new window]" target="_blank">Biglotron</a>',
-'bittorrent_bot','<a href="http://www.bittorrent.com/" title="Bot home page [new window]" target="_blank">BitTorrent Bot</a>',
-'biz360[_+\s]spider','<a href="http://www.biz360.com/" title="blogsmanager@biz360.com Bot home page [new window]" target="_blank">Biz360 spider</a>',
-'blexbot', '<a href="http://webmeup-crawler.com" rel="nofollow" title="BLEXBot Home Page [new window]" target="_blank">BLEXBot</a>, seems to belong to the <a href="http://webmeup.com/" rel="nofollow" title="WebMeUp Home Page [new window]" target="_blank">WebMeUp backlink tool</a>',
-'blogbridge[_+\s]service','<a href="http://www.blogbridge.com/" title="Bot home page [new window]" target="_blank">BlogBridge Service</a>',
-'bloglines','<a href="http://www.bloglines.com/" title="Bot home page [new window]" target="_blank">Bloglines</a>',
-'blogpulse','<a href="http://www.intelliseek.com/" title="Bot home page [new window]" target="_blank">BlogPulse ISSpider intelliseek.com</a>',
-'blogsearch','<a href="http://www.icerocket.com/" title="Bot home page [new window]" target="_blank">BlogSearch</a>',
-'blogshares','<a href="http://blogshares.com/help.php?node=7" title="Bot home page [new window]" target="_blank">Blogshares Spiders</a>',
-'blogslive','<a href="http://www.blogslive.com/" title="info@blogslive.com Bot home page [new window]" target="_blank">Blogslive</a>',
-'blogssay','<a href="http://www.blogssay.com/" title="Bot home page [new window]" target="_blank">BlogsSay :: RSS Search Crawler</a>',
-'bncf\.firenze\.sbn\.it\/raccolta\.txt','<a href="http://www.bncf.firenze.sbn.it/raccolta.txt" title="Bot home page [new window]" target="_blank">Biblioteca Nazionale Centrale di Firenze</a>',
-'bobby', 'Bobby',
-'boitho\.com\-dc','<a href="http://www.boitho.com/dcbot.html" title="Bot home page [new window]" target="_blank">boitho.com-dc</a>',
-'bookmark\-manager','<a href="http://bkm.sourceforge.net/" title="Bookmark-Manager home page [new window]" target="_blank">Bookmark-Manager</a>',
-'boris', 'Boris',
-'bubing', '<a href="http://law.di.unimi.it/BUbiNG.html" title="BUbiNG [new window]" target="_blank">BUbiNG</a>',
-'bumblebee', 'Bumblebee (relevare.com)',
-'candlelight[_+\s]favorites[_+\s]inspector','<a href="http://www.candlelight.com/home.html" title="Candlelight_Favorites_Inspector  home page [new window]" target="_blank">Candlelight_Favorites_Inspector</a>',
-'careerbot',  '<a href="http://www.career-x.de/bot.html" rel="nofollow" title="CareerBot home page [new window]" target="_blank">CareerBot</a>',
-'cbn00glebot','cbn00glebot',
-'ccbot', '<a href="http://commoncrawl.org/faq/" rel="nofollow" title="Common Crawl FAQ Page [new window]" target="_blank">Common Crawl</a>',
-'cerberian_drtrs','<a href="http://www.pgts.com.au/cgi-bin/psql?robot_info=25240" title="Bot home page [new window]" target="_blank">Cerberian Drtrs</a>',
-'cfnetwork','<a href="http://www.cocoadev.com/index.pl?CFNetwork" title="CFNetwork home page [new window]" target="_blank">CFNetwork</a>',
-'cipinetbot','<a href="http://www.cipinet.com/bot.html" title="CipinetBot home page [new window]" target="_blank">CipinetBot</a>',
-'checkweb_link_validator','<a href="http://p.duby.free.fr/chkweb.htm" title="CheckWeb link validator home page [new window]" target="_blank">CheckWeb link validator</a>',
-'cliqzbot', '<a href="http://cliqz.com/company/cliqzbot" rel="nofollow" title="Cliqzbot Home Page [new window]" target="_blank">Cliqzbot</a>',
-'commons\-httpclient','<a href="http://jakarta.apache.org/commons/httpclient/" title="Bot home page [new window]" target="_blank">Jakarta commons-httpclient</a>',
-'computer_and_automation_research_institute_crawler','<a href="http://www.ilab.sztaki.hu/~stamas/publications/p184-benczur.html" title="Computer and Automation Research Institute Crawler home page [new window]" target="_blank">Computer and Automation Research Institute Crawler</a>',
-'converamultimediacrawler','<a href="http://www.authoritativeweb.com/crawl/" title="ConveraMultiMediaCrawler home page [new window]" target="_blank">ConveraMultiMediaCrawler</a>',
-'converacrawler','<a href="http://www.authoritativeweb.com/crawl/" title="ConveraCrawler home page [new window]" target="_blank">ConveraCrawler</a>',
-'copubbot', '<a href="http://www.copub.com/bot.php" rel="nofollow" title="CoPubbot Home Page [new window] Note: Access to bot home page gave a 404 error on Dec 21, 2013" target="_blank">CoPubbot</a>',
-'cscrawler','CsCrawler',
-'cse_html_validator_lite_online','<a href="http://online.htmlvalidator.com/php/onlinevallite.php" title="CSE HTML Validator Lite Online home page [new window]" target="_blank">CSE HTML Validator Lite Online</a>','cuasarbot','<a href="http://www.cuasar.com/" title="Cuasarbot home page [new window]" target="_blank">Cuasarbot</a>',
-'cursor','<a href="http://adcenter.hu/docs/en/bot.html " title="Cursor home page [new window]" target="_blank">Cursor</a>',
-'custo','<a href="http://www.netwu.com/custo/" title="Custo home page [new window]" target="_blank">Custo</a>',
-'datafountains\/dmoz_downloader','<a href="http://infomine.ucr.edu/ " title="DataFountains/DMOZ Downloader home page [new window]" target="_blank">DataFountains/DMOZ Downloader</a>',
-'dataprovider\.com', '<a href="http://www.dataprovider.com/" title="Dataprovider Site Explorer [new window]" target="_blank">Dataprovider Site Explorer</a>',
-'daumoa', '<a href="http://tab.search.daum.net/aboutWebSearch.html" title="Daum [new window]" target="_blank">Daum</a>',
-'daviesbot', 'DaviesBot',
-'daypopbot', 'DayPop',
-'deepindex','<a href="http://www.deepindex.net/faq.php" title="Deepindex home page [new window]" target="_blank">Deepindex</a>',
-'deusu', '<a href="https://deusu.de/robot.html" rel="nofollow" title="DeuSu [new window]" target="_blank">DeuSu</a>',
-'dipsie\.bot','<a href="http://www.dipsie.com/bot/" title="Bot home page [new window]" target="_blank">Dipsie</a>',
-'dnsgroup','<a href="http://www.dnsgroup.com/" title="DNSGroup home page [new window]" target="_blank">DNSGroup</a>',
-'doccheckbot', 'doccheckbot/1.0, known to <a href="http://www.projecthoneypot.org/ip_46.229.160.208" rel="nofollow" title="Info to IP 46.229.160.208 [new window]" target="_blank">Project Honey Pot</a>',
-'domainchecker','<a href="http://net-promoter.com/" title="DomainChecker home page (not confirmed) [new window]" target="_blank">DomainChecker</a>',
-'domainsdb\.net','<a href="http://domainsdb.net/" title="Bot home page [new window]" target="_blank">DomainsDB.net</a>',
-'dotbot',  '<a href="http://www.opensiteexplorer.org/dotbot" rel="nofollow" title="Home Page [new window]" target="_blank">DotBot, Open Site Explorer</a>',
-'duckduckgo-favicons-bot', '<a href="http://duckduckgo.com" rel="nofollow" title="DuckDuckGo Home Page [new window]" target="_blank">DuckDuckGo-Favicons-Bot</a>',
-'dulance','<a href="http://www.dulance.com/bot.jsp" title="Bot home page [new window]" target="_blank">Dulance</a>',
-'dumbot','<a href="http://www.dumbfind.com/" title="Dumbot home page [new window]" target="_blank">Dumbot</a>',
-'dumm\.de\-bot','<a href="http://www.dumm.de/" title="dumm.de-Bot home page [new window]" target="_blank">dumm.de-Bot</a>',
-'earthcom\.info','<a href="http://www.earthcom.info/" title="Bot home page [new window]" target="_blank">EARTHCOM.info</a>',
-'easydl','<a href="http://keywen.com/Encyclopedia/Bot/" title="EasyDL  home page [new window]" target="_blank">EasyDL</a>',
-'eccp', '<a href="http://www.eniro.com/" rel="nofollow" title="Eniro Sverige home page [new window]" target="_blank">Eniro Sverige, email: search (at) eniro.com</a>',
-'edgeio\-retriever','<a href="http://www.edgeio.com/" title="Bot home page [new window]" target="_blank">edgeio-retriever</a>',
-'ernst[:blank:]2\.0', 'Ernst 2.0 (does not provide any further information)',
-'ets_v','<a href="http://www.freetranslation.com/help/" title="ETS home page [new window]" target="_blank">ETS</a> Enterprise Translation Server',
-'exactseek','ExactSeek Crawler',
-'extreme[_+\s]picture[_+\s]finder','<a href="http://www.exisoftware.com/" title="Extreme_Picture_Finder home page [new window]" target="_blank">Extreme_Picture_Finder</a>',
-'eventax','<a href="http://www.eventax.de/" title="eventax home page [new window]" target="_blank">eventax</a>',
-'everbeecrawler','EverbeeCrawler',
-'everest\-vulcan','<a href="http://everest.vulcan.com/crawlerhelp" title="Bot home page [new window]" target="_blank">Everest-Vulcan</a>',
-'ezresult', 'Ezresult',
-'enteprise','<a href="http://www.fastsearch.com/" title="Bot home page [new window]" target="_blank">Fast Enteprise Crawler</a>',
-'facebook','FaceBook bot',
-'facebot', '<a href="https://developers.facebook.com/docs/opengraph/howtos/maximizing-distribution-media-content" rel="nofollow" title=" Home Page [new window]" target="_blank">Facebot (Facebook bot?)</a>',
-'fast\-search\-engine','<a href="http://www.fast-search-engine.com/" title="Bot home page [new window]" target="_blank">Fast-Search-Engine</a> (not fastsearch.com)',
-'fast_enterprise_crawler','<a href="http://www.fast.no/" title="FAST Enterprise Crawler home page [new window]" target="_blank">FAST Enterprise Crawler</a>',
-'fast_enterprise_crawler.*scrawleradmin\.t\-info@telekom\.de','<a href="http://www.telekom.de/" title="FAST Enterprise Crawler * crawleradmin.t-info@telekom.de home page [new window]" target="_blank">FAST Enterprise Crawler * crawleradmin.t-info@telekom.de</a>',
-'finderlein[_+\s]research[_+\s]crawler', 'Finderlein Research Crawler 1.0 (no contact information given)',
-'matrix_s\.p\.a\._\-_fast_enterprise_crawler','<a href="http://tin.virgilio.it/" title="Matrix S.p.A. - FAST Enterprise Crawler home page [new window]" target="_blank">Matrix S.p.A. - FAST Enterprise Crawler</a>',
-'fast_enterprise_crawler.*t\-info_bi_cluster_crawleradmin\.t\-info@telekom\.de','<a href="http://www.telekom.de/" title="FAST Enterprise Crawler * T-Info_BI_cluster crawleradmin.t-info@telekom.de home page [new window]" target="_blank">FAST Enterprise Crawler * T-Info_BI_cluster crawleradmin.t-info@telekom.de</a>',
-'fastbot', '<a href="http://www.fastbot.de" rel="nofollow" title="fastbot Home Page [new window]" target="_blank">fastbot</a>',
-'favicon','FavIconizer',
-'favorg','<a href="http://www.pcmag.com/article2/0,4149,108438,00.asp" title="FavOrg home page [new window]" target="_blank">FavOrg</a>',
-'favorites_sweeper','<a href="http://www.manitools.com/favsweep/" title="Favorites_Sweeper home page [new window]" target="_blank">Favorites Sweeper</a>',
-'feedburner', 'Feedburner',
-'feedfetcher\-google','<a href="http://www.google.com/feedfetcher.html" title="Bot home page [new window]" target="_blank">Feedfetcher-Google</a>',
-'feedflow','<a href="http://feedflow.com/about" title="Bot home page [new window]" target="_blank">FeedFlow</a>',
-'feedster','<a href="http://www.feedster.com/" title="Bot home page [new window]" target="_blank">Feedster</a>',
-'feedsky','<a href="http://www.feedsky.com/" title="Bot home page [new window]" target="_blank">FeedSky</a>',
-'feedvalidator','<a href="http://feedvalidator.org/" title="FeedValidator home page [new window]" target="_blank">FeedValidator</a>',
-'fetchbot', '<a href="https://github.com/PuerkitoBio/fetchbot" rel="nofollow" title="Fetchbot Home Page [new window]" target="_blank">Fetchbot</a>',
-'filmkamerabot','<a href="http://www.filmkamera.at/bot.html" title="FilmkameraBot home page [new window]" target="_blank">FilmkameraBot</a>',
-'filterdb\.iss\.net',  '<a href="http://filterdb.iss.net/crawler/" title="oBot Home Page [new window]" target="_blank">oBot</a>',
-'findexa_crawler','<a href="http://www.findexa.no/gulesider/article26548.ece " title="Findexa Crawler home page [new window]" target="_blank">Findexa Crawler</a>',
-'firmilybot', '<a href="http://www.firmily.com/bot.php" title="Firmily Bot [new window]" target="_blank">Firmily Bot Home page (Website was hacked on Oct. 19, 2013)</a>',
-'findlinks','<a href="http://wortschatz.uni-leipzig.de/findlinks/" title="Bot home page [new window]" target="_blank">Findlinks</a>',
-'foaf-search\.net', '<a href="http://www.foaf-search.net/" title="Friend of a friend (FOAF) search engine [new window]" target="_blank">Friend of a friend (FOAF) search engine</a>',
-'fooky\.com\/ScorpionBot','<a href="http://www.fooky.com/scorpionbots" title="Fooky.com/ScorpionBot/ScoutOut home page [new window]" target="_blank">Fooky.com/ScorpionBot/ScoutOut</a>',
-'g2crawler','<a href="http://crawler.instantnetworks.net/" title="Bot home page (nobody@airmail.net) [new window]" target="_blank">G2Crawler</a>',
-'gaisbot','<a href="http://gais.cs.ccu.edu.tw/robot.php" title="Bot home page [new window]" target="_blank">Gaisbot</a>',
-'geniebot','<a href="http://www.genieknows.com/" title="Bot home page [new window]" target="_blank">Geniebot</a>',
-'genieo', '<a href="http://www.genieo.com/webfilter.html" rel="nofollow" title="Genieo [new window]" target="_blank">Genieo</a>',
-'gigablastopensource', '<a href="http://www.gigablast.com/" rel="nofollow" title="Gigablast Home page [new window]"  target="_blank">GigablastOpenSource</a>, an Open Source Search Engine(<a href="https://github.com/gigablast/open-source-search-engine/wiki" rel="nofollow" title="at GitHub [new window]" target="_blank">Wiki</a>)',
-'gigabot','<a href="http://www.gigablast.com/spider.html" title="Bot home page [new window]" target="_blank">GigaBot</a>',
-'girafabot','<a href="http://www.girafa.com/" title="Bot home page [new window]" target="_blank">Girafabot</a>',
-'global_fetch','<a href="http://www.wesonet.com/" title="Global Fetch home page [new window]" target="_blank">Global Fetch</a>',
-'gnodspider','GNOD Spider',
-'goforit\.com','<a href="http://www.goforit.com/about/" title="GoForIt.com home page [new window]" target="_blank">GoForIt.com</a>',
-'goforitbot','<a href="http://www.goforit.com/about/" title="GOFORITBOT home page [new window]" target="_blank">GOFORITBOT</a>',
-'gonzo','<a href="http://www.suchen.de/faq.html" title="Bot home page [new windows]" target="_blank">suchen.de</a>',
-'gpu_p2p_crawler','<a href="http://gpu.sourceforge.net/search_engine.php" title="Bot home page [new window]" target="_blank">GPU p2p crawler</a>',
-'grapeshot', '<a href="http://www.grapeshot.co.uk/crawler.php" title="Grapeshot Crawler [new window]" target="_blank">Grapeshot Crawler</a>',
-'grub','Grub.org',
-'henrythemiragorobot', '<a href="http://www.miragorobot.com/scripts/mrinfo.asp" title="Bot home page [new window]" target="_blank">Mirago</a>',
-'heritrix','<a href="http://crawler.archive.org/" title="(used by a few different companies) Bot home page [new window]" target="_blank">Heritrix</a>',
-'holmes', 'Holmes',
-'hoowwwer','<a href="http://cosco.hiit.fi/search/hoowwwer/" title="HooWWWer home page [new window]" target="_blank">HooWWWer</a>',
-'hpprint','HPPrint',
-'htmlparser','<a href="http://htmlparser.sourceforge.net/" title="HTMLParser home page [new window]" target="_blank">HTMLParser</a>',
-'html[_+\s]link[_+\s]validator','<a href="http://www.lithopssoft.com/ " title="Html_Link_Validator home page [new window]" target="_blank">Html_Link_Validator</a>',
-'httrack','<a href="http://www.httrack.com/" title="Bot home page [new window]" target="_blank">HTTrack off-line browser</a>',
-'hundesuche\.com\-bot','<a href="http://www.hundesuche.com/" title="Hundesuche.com-Bot home page [new window]" target="_blank">Hundesuche.com-Bot</a>',
-'i-bot','i-bot',
-'icarus6j', 'Icarus6j, email address in UA string, no website',
-'ichiro','<a href="http://help.goo.ne.jp/door/crawlerE.html" title="Bot home page [new window]" target="_blank">ichiro</a>',
-'idmarch', '<a href="http://www.idmarch.org/bot.html" rel="nofollow" title=" Home Page [new window]" target="_blank">IDMARCH</a>',
-'iltrovatore\-setaccio','<a href="http://www.iltrovatore.it/aiuto/motore_di_ricerca.html" title="bot@iltrovatore.it IlTrovatore-Setaccio home page [new window]" target="_blank">IlTrovatore-Setaccio</a>',
-'implisensebot', '<span title="As on Sep. 18, 2015, the user agent string did not contain a web address.">ImplisenseBot</span>',
-'infobot','<a href="http://www.infobot.org/" title="InfoBot home page [new window]" target="_blank">InfoBot</a>',
-'infociousbot','<a href="http://corp.infocious.com/tech_crawler.php" title="InfociousBot home page [new window]" target="_blank">InfociousBot</a>',
-'infohelfer','<a href="http://www.infohelfer.de/crawler.php" title="Infohelfer home page [new window]" target="_blank">Infohelfer</a>',
-'infomine','<a href="http://infomine.ucr.edu/useragents" title="Bot home page [new window]" target="_blank">INFOMINE VLCrawler</a>',
-'insurancobot','<a href="http://www.fastspywareremoval.com/" title="InsurancoBot home page [new window]" target="_blank">InsurancoBot</a>',
-'integromedb\.org','<a href="http://www.integromedb.org/Crawler" title="IntegromeDB home page [new window]" target="_blank">IntegromeDB</a>',
-'internet[_+\s]ninja','<a href="http://www.dti.ne.jp/  " title="Internet_Ninja home page [new window]" target="_blank">Internet_Ninja </a>',
-'internetarchive','<a href="http://lucene.apache.org/nutch/bot.html " title="InternetArchive home page [new window]" target="_blank">InternetArchive</a>',
-'internetseer', 'InternetSeer',
-'internetsupervision','<a href="http://internetsupervision.com/" title="InternetSupervision home page [new window]" target="_blank">InternetSupervision</a>',
-'irlbot','<a href="http://irl.cs.tamu.edu/crawler" title="Bot home page [new window]" target="_blank">IRLbot</a>',
-'isearch2006','<a href="http://www.yahoo.com.cn/" title="isearch2006 home page [new window]" target="_blank">isearch2006</a>',
-'istellabot', '<a href="http://www.tiscali.it/" title="IstellaBot [new window]" target="_blank">IstellaBot</a>',
-'iupui_research_bot','<a href="http://spamhuntress.com/2005/04/25/a-mail-harvester-visits/" title="IUPUI_Research_Bot home page [new window]" target="_blank">IUPUI_Research_Bot</a>',
-'izsearch', '<a href="http://izsearch.com/" rel="nofollow" title="iZSearch Home Page [new window]" target="_blank">iZSearch</a>',
-'james\sbot', '<a href="http://cognitiveseo.com/bot.html" rel="nofollow" title="James BOT Home Page [new window]" target="_blank">James BOT</a>',
-'jobboerse', '<a href="http://www.xn--jobbrse-d1a.com" rel="nofollow" title="Jobb&ouml;rse Home Page [new window]" target="_blank">Jobb&ouml;rse</a>',
-'jrtwine[_+\s]software[_+\s]check[_+\s]favorites[_+\s]utility','<a href="http://www.jrtwine.com/Products/CheckFavs/" title="JRTwine_Software_Check_Favorites_Utility  home page [new window]" target="_blank">JRTwine_Software_Check_Favorites_Utility</a>',
-'justview', 'JustView',
-'kalambot','<a href="http://64.124.122.251/feedback.html" title="KalamBot home page [new window]" target="_blank">KalamBot</a>',
-'kamano\.de_newsfeedverzeichnis','<a href="http://www.kamano.de/" title="kamano.de NewsFeedVerzeichnis home page [new window]" target="_blank">kamano.de NewsFeedVerzeichnis</a>',
-'kazoombot','<a href="http://www.kazoom.ca/bot.html" title="kazoombot@kazoom.ca KazoomBot home page [new window]" target="_blank">KazoomBot</a>',
-'kevin','<a href="http://dznet.com/kevin/" title="Kevin home page [new window]" target="_blank">Kevin</a>',
-'keyoshid','<a href="http://www.yahoo.co.jp/" title="Bot home page [new window]" target="_blank">Yahoo! Japan keyoshid robot study</a>',
-'kinjabot', 'Kinjabot',
-'kinja\-imagebot', 'Kinja Imagebot',
-'knowitall','<a href="http://www.cs.washington.edu/research/knowitall/" title="KnowItAll home page [new window]" target="_blank">KnowItAll</a>',
-'knowledge\.com','<a href="http://www.knowledge.com/" title="Knowledge.com home page [new window]" target="_blank">Knowledge.com</a>',
-'kouaa_krawler','<a href="http://www.kouaa.com/" title="Kouaa Krawler home page [new window]" target="_blank">Kouaa Krawler</a>',
-'krugle','<a href="http://www.krugle.com/crawler/info.html" title="Bot home page [new window]" target="_blank">Krugle</a>',
-'ksibot','<a href="http://ego.ms.mff.cuni.cz/" title="Bot home page [new window]" target="_blank">ksibot</a>',
-'kurzor','<a href="http://www.easymail.hu/" title="cursor@easymail.hu Kurzor home page [new window]" target="_blank">Kurzor</a>',
-'lanshanbot','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=%5Cbid_g_l_140406_1%5Cb" title="Bot Information [new window]" target="_blank">lanshanbot</a>',
-'letscrawl\.com','<a href="http://letscrawl.com/" title="Bot home page [new window]" target="_blank">LetsCrawl.com</a>',
-'libcrawl','Crawl libcrawl',
-'link_valet_online','<a href="http://www.htmlhelp.com/tools/valet/" title="Link Valet Online home page [new window]" target="_blank">Link Valet Online</a>',
-'linkbot','LinkBot',
-'linkdex\.com', '<a href="http://www.linkdex.com/about/bots/" title="Bot home page [new window]" target="_blank">Linkdex</a>',
-'linkchecker','<a href="http://linkchecker.sourceforge.net" title="Bot home page [new window]" target="_blank">LinkChecker</a>',
-'linkstats\sbot', '<span title="As on Nov. 7, 2015, the user agent string did not contain a web address.">LinkStats Bot</span>',
-'lipperhey', '<a href="http://www.lipperhey.com/" rel="nofollow" title="Lipperhey SEO Service Home Page [new window]" target="_blank">Lipperhey SEO Service</a>',
-'livejournal\.com', 'LiveJournal.com',
-'loadtimebot', '<a href="http://www.loadtime.net/bot.html" rel="nofollow" title="LoadTimeBot Home Page [new window]" target="_blank">LoadTimeBot</a>',
-'lssrocketcrawler', '<span title="Example UA-String &quot;LSSRocketCrawler/1.0 LightspeedSystems&quot;">LSSRocketCrawler (no contact information)</span>',
-'ltbot', '<a href="http://www.language-tools.com/" title="Language Tools Home Page [new window]" target="_blank">Language Tools Bot (ltbot)</a>',
-'ltx71', '<a href="http://ltx71.com/" rel="nofollow" title="ltx71 Home Page [new window]" target="_blank">ltx71</a>',
-'madaali\.de', '<a href="http://www.madaali.de/pfadzurbotseite/bot.html" rel="nofollow" title="Link resulted in a 404 Error on Nov 6, 2014 [new window]" target="_blank">www.madaali.de</a>',
-'magpierss', 'MagpieRSS',
-'mail\.ru', '<a href="http://go.mail.ru/help/robots" title="Mail.ru bot home page [new window]" target="_blank">Mail.ru bot</a>',
-'mapoftheinternet\.com','<a href="http://MapoftheInternet.com/" title="MapoftheInternet.com home page [new window]" target="_blank">MapoftheInternet.com</a>',
-'meanpathbot', '<a href="http://www.meanpath.com/meanpathbot.html" rel="nofollow" title="Meanpathbot Home Page [new window]" target="_blank">Meanpathbot</a>',
-'mediabot', '<a href="http://isdownload.biz" rel="nofollow" title="MediaBot refers to isdownload.biz [new window]" target="_blank">MediaBot</a>',
-'mediapartners\-google','<a href="https://adwords.google.com/" title="Bot home page [new window]" target="_blank">Google AdSense</a>',
-# 'Mediapartners-Google (Feb 12, 2015: no additial information in UA String, seems to use <a href="http://www.gigablast.com/" title="Gigablast Home page [new window]">GigablastOpenSource</a>',
-# Uses UA string "Mediapartners-Google" only, and there were accesses using an UA string "GigablastOpenSource/1.0" from the same IP-Address.
-# Therefore this is probably not related to Google 4.3.2015 Albrecht Müller
-'megaindex', '<a href="http://megaindex.com/crawler" rel="nofollow" title="MegaIndex Crawler Page [new window]" target="_blank">MegaIndex Crawler</a>, seems to belong to <a href="https://www.megaindex.ru/" rel="nofollow" title="MegaIndex.ru Home Page [new window]" target="_blank">MegaIndex.ru</a>',
-'megite','<a href="http://www.megite.com/" title="Megite home page [new window]" target="_blank">Megite</a>',
-'memorybot', '<a href="http://archivethe.net/en/index.php/about/internet_memory1" rel="nofollow" title="Archivethe.net Home Page [new window]" target="_blank">Archivethe.net</a>',
-'metager2-verification-bot', '<a href="http://metager2.de/technology.php" rel="nofollow" title="metager2-verification-bot Home Page [new window]" target="_blank">metager2-verification-bot</a>',
-'metager\-linkchecker','MetaGer LinkChecker',
-'metajobbot', '<a href="http://www.metajob.de/crawler" rel="nofollow" title="MetaJobBot [new window]" target="_blank">MetaJobBot</a>',
-'metaspinner','<a href="http://index.meta-spinner.de/" title="Metaspinner home page [new window]" target="_blank">Metaspinner</a>',
-'miadev',  '<a href="http://www.mia-marktplatz.de/spider" rel="nofollow" title="MiaDev spider [new window]" target="_blank">MiaDev spider</a>',
-'microsoft\sbits', '<a href="http://msdn.microsoft.com/en-us/library/bb968799%28v=vs.85%29.aspx" rel="nofollow" title="Microsoft Background Intelligent Transfer Service (BITS)? [new window]" target="_blank">Microsoft Background Intelligent Transfer Service (BITS)?</a>',
-'microsoft.*discovery', '<a href="http://support.microsoft.com/kb/838028/en-us" title="Microsoft KB838028 [new window]" target="_blank">Microsoft Office Protocol Discovery</a>/<a href="http://blogs.msdn.com/b/vsofficedeveloper/archive/2008/03/11/office-existence-discovery-protocol.aspx" title="Description of the Microsoft Office Existence Discovery [new window]" target="_blank">Microsoft Office Existence Discovery</a>',
-'microsoft[_+\s]url[_+\s]control','<a href="http://www.webmasterworld.com/forum11/1005.htm" title="Microsoft URL Control  home page [new window]" target="_blank">Microsoft URL Control</a>',
-'mindupbot', '<a href="http://datenbutler.de" rel="nofollow" title="DATENBUTLER home page [new window]" target="_blank">mindUpBot (datenbutler.de)</a>',
-'minirank','<a href="http://minirank.com/" title="miniRank home page [new window]" target="_blank">miniRank</a>',
-'mini\-reptile','Mini-reptile',
-'missigua_locator','<a href="http://www.webmasterworld.com/forum11/2690.htm" title="Missigua_Locator  home page [new window]" target="_blank">Missigua_Locator</a>',
-'misterbot','<a href="http://www.misterbot.fr/" title="Misterbot home page [new window]" target="_blank">Misterbot</a>',
-'miva','<a href="http://www.miva.com/" title="Miva home page [new window]" target="_blank">Miva</a>',
-'mizzu_labs','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_m_141105_2\b " title="Mizzu Labs home page [new window]" target="_blank">Mizzu Labs</a>',
-'mj12bot','<a href="http://majestic12.co.uk/bot.php" title="Bot home page. [new window]" target="_blank">MJ12bot</a>',
-'mojeekbot','<a href="http://www.mojeek.com/bot.html" title="Bot home page. [new window]" target="_blank">MojeekBot</a>',
-'msiecrawler','<a href="http://msdn.microsoft.com/workshop/delivery/offline/linkrel.asp" title="Bot home page. [new window]" target="_blank">MSIECrawler</a>',
-'ms[_+\s]search[_+\s]6\.0[_+\s]robot','<a href="http://support.microsoft.com/default.aspx?scid=kb;en-us;284022" title="Microsoft Support Page. [new window]" target="_blank">MS Search 6.0 Robot</a> (MS SharePoint Portal Server?)',
-'ms_search_4\.0_robot','<a href="http://support.microsoft.com/default.aspx?scid=kb;en-us;284022" title="Bot home page. [new window]" target="_blank">MS SharePoint Portal Server - MS Search 4.0 Robot</a>',
-'msrabot','msrabot',
-'msrbot','<a href="http://research.microsoft.com/research/sv/msrbot/" title="MSRBOT home page [new window]" target="_blank">MSRBOT</a>',
-'mt::telegraph::agent','MT::Telegraph::Agent',
-'mydoyouhike','<a href="http://www.doyouhike.net/my" title="Mydoyouhike home page [new window]" target="_blank">Mydoyouhike</a>',
-'nagios','Nagios',
-'nasa_search','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_n_s_140506_2\b" title="NASA Search home page [new window]" target="_blank">NASA Search</a>',
-'netestate\sne\scrawler','<a href="http://www.website-datenbank.de/" title="Website-Datenbank home page [new window]" target="_blank">Website-Datenbank</a>',
-'netluchs','<a href="http://www.netluchs.de/" title="Bot home page. [new window]" target="_blank">Netluchs</a>',
-'netsprint','<a href="http://www.netsprint.pl/serwis/" title="NetSprint home page [new window]" target="_blank">NetSprint</a>',
-'newsgatoronline', 'NewsGator Online',
-'nicebot','<a href="http://www.egghelp.org/setup.htm" title="Bot home page (there may be others) [new window]" target="_blank">nicebot</a>',
-'nimblecrawler','<a href="http://www.healthline.com/" title="NimbleCrawler home page [new window]" target="_blank">NimbleCrawler</a>',
-'noxtrumbot','<a href="http://www.noxtrum.com/" title="Bot home page [new window]" target="_blank">noxtrumbot</a>',
-'npbot','<a href="http://www.nameprotect.com/botinfo.html" title="NPBot home page [new window]" target="_blank">NPBot</a>',
-'loocalcrawler/nutch', '<a href="https://weluse.de/" rel="nofollow" title="https://weluse.de/ [new window]" target="_blank">LoocalCrawler/Nutch</a>',
-'nutchcvs','<a href="http://lucene.apache.org/nutch/bot.html" title="NutchCVS home page [new window]" target="_blank">NutchCVS</a>',
-'nutchosu\-vlib','<a href="http://lucene.apache.org/nutch/bot.html" title="NutchOSU-VLIB home page [new window]" target="_blank">NutchOSU-VLIB</a>',
-'nutch','<a href="http://lucene.apache.org/nutch/" title="Bot home page. Used by many, including Looksmart. [new window]" target="_blank">Nutch</a>',
-'ocelli','<a href="http://www.globalspec.com/Ocelli/" title="Ocelli home page [new window]" target="_blank">Ocelli</a>',
-'octora_beta_bot','<a href="http://www.octora.com/" title="Bot home page [new window]" target="_blank">Octora Beta Bot</a>',
-'omniexplorer[_+\s]bot','<a href="http://www.omni-explorer.com/" title="Bot home page. [new window]" target="_blank">OmniExplorer Bot</a>',
-'onet\.pl[_+\s]sa','<a href="http://szukaj.onet.pl/" title="Onet.pl_SA home page [new window]" target="_blank">Onet.pl_SA</a>',
-'onfolio','<a href="http://www.onfolio.com/" title="Bot home page [new window]">Onfolio</a>',
-'opentaggerbot','<a href="http://www.opentagger.com/opentaggerbot.htm" title="Bot home page [new window]">OpenTaggerBot</a>',
-'openwebspider','<a href="http://www.openwebspider.org/" title="OpenWebSpider home page [new window]" target="_blank">OpenWebSpider</a>',
-'optimizer', '<span title="As on Oct. 2, 2015, the user agent string did not contain a web address.">Optimizer</span>',
-'oracle_ultra_search','<a href="http://www.oracle.com/technology/products/ultrasearch/index.html" title="Oracle Ultra Search home page [new window]" target="_blank">Oracle Ultra Search</a>',
-'orangebot', 'OrangeBot, no website, log entry specifies mail address', # support.orangebot@orange.com
-'orbiter','<a href="http://www.dailyorbit.com/bot.htm" title="Orbiter home page [new window]" target="_blank">Orbiter</a>',
-'yodaobot','<a href="http://www.yodao.com/help/webmaster/spider/" title="YodaoBot">OutfoxBot/YodaoBot</a>',
-'qihoobot','<a href="http://www.qihoo.com/" title="QihooBot">QihooBot</a>',
-'qwantify', '<a href="https://www.qwant.com/" rel="nofollow" title="Qwant Home Page [new window]" target="_blank">Qwant</a>',
-'passwordmaker\.org','<a href="http://passwordmaker.org/" title="passwordmaker.org home page [new window]" target="_blank">passwordmaker.org</a>',
-'pear_http_request_class','<a href="http://pear.php.net/" title="PEAR HTTP Request class home page [new window]" target="_blank">PEAR HTTP Request class</a>',
-'peerbot','<a href="http://www.peerbot.com/" title="PEERbot home page [new window]" target="_blank">PEERbot</a>',
-'perman', 'Perman surfer',
-'php[_+\s]version[_+\s]tracker','<a href="http://www.nexen.net/phpversion/bot.php" title="PHP Version Tracker home page [new window]" target="_blank">PHP version tracker</a>',
-'phpcrawl', '<a href="http://phpcrawl.cuab.de/" rel="nofollow" title="PHPCrawl Home page [new window]" target="_blank">PHPCrawl</a>',
-'picmole', '<a href="http://www.picmole.com/" rel="nofollow" title="Bot home page. [new window]" target="_blank">Specified address www.picmole.com was not reachable on April 21, 2014</a>',
-'pictureofinternet','<a href="http://malfunction.org/poi/" title="PictureOfInternet home page [new window]" target="_blank">PictureOfInternet</a>',
-'ping\.blo\.gs','<a href="http://blo.gs/ping.php" title="Bot home page. [new window]" target="_blank">ping.blo.gs</a>',
-'plinki','<a href="http://www.plinki.com/" title="plinki home page [new window]" target="_blank">plinki</a>',
-'pluckfeedcrawler','<a href="http://www.pluck.com/" title="Bot home page. [new window]" target="_blank">PluckFeedCrawler</a>',
-'plukkie',  '<a href="http://www.botje.com/plukkie.htm" rel="nofollow" title="Plukkie [new window]" target="_blank">Plukkie</a>',
-'pogodak','<a href="http://www.pogodak.com" title="Pogodak home page [new window]" target="_blank">Pogodak.com</a>',
-'pompos','<a href="http://dir.com/pompos.html" title="Bot home page. [new window]" target="_blank">Pompos</a>',
-'popdexter','Popdexter',
-'port_huron_labs','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_n_s_1133\b" title="Port Huron Labs home page [new window]" target="_blank">Port Huron Labs</a>',
-'postfavorites','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_n_s_1135\b " title="PostFavorites home page [new window]" target="_blank">PostFavorites</a>',
-'projectwf\-java\-test\-crawler','ProjectWF-java-test-crawler',
-'proodlebot','<a href="http://www.proodle.com/" title="proodleBot home page [new window]" target="_blank">proodleBot</a>',
-'publiclibraryarchive', '<a href="http://publiclibraryarchive.org" rel="nofollow" title="On 23 June 2014 a page parked at GoDaddy [new window]" target="_blank">publiclibraryarchive.org (related to spiderlytics.com and/or waybackarchive.org?)</a>',
-#Observations 2014-06-23
-#Domain publiclibraryarchive.org is parked at GoDaddy.com
-#from https://www.projecthoneypot.org/
-#81.30.151.220's User Agent Strings (honeypot classified this ip as an mail server, active about 6 years ago)
-#Mozilla/5.0 (compatible; publiclibraryarchive.org/1.0; +crawl@publiclibraryarchive.org)
-#176.9.138.27's User Agent Strings
-#Mozilla/5.0 (compatible; publiclibraryarchive.org/1.0; +crawl@publiclibraryarchive.org)
-#Mozilla/5.0 (compatible; Spiderlytics/1.0; +spider@spiderlytics.com)
-#Mozilla/5.0 (compatible; waybackarchive.org/1.0; +spider@waybackarchive.org)
-#146.0.32.165's User Agent Strings
-#Mozilla/5.0 (compatible; publiclibraryarchive.org/1.0; +crawl@publiclibraryarchive.org)
-#Mozilla/5.0 (compatible; savetheworldheritage.org/1.0; +crawl@savetheworldheritage.org)
-#Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
-'pyquery','<a href="http://sourceforge.net/projects/pyquery/" title="PyQuery home page [new window]" target="_blank">PyQuery</a>',
-'rambler','<a href="http://www.rambler.ru/doc/faq.shtml" title="Bot home page [new window]">StackRambler</a>',
-'redalert','Red Alert',
-'relevantnoise\.com', '<a href="http://www.relevantnoise.com/" title="Relevant Noise [new window]" target="_blank">Relevant Noise</a>',
-'riddler', '<a href="http://riddler.io/about" rel="nofollow" title="Riddler [new window]" target="_blank">Riddler</a>',
-'rogerbot', '<a href="http://moz.com/help/pro/what-is-rogerbot-" rel="nofollow" title="Rogerbot Home Page [new window]" target="_blank">Rogerbot</a>',
-'rojo','<a href="http://rojo.com/" title="Bot home page [new window]" target="_blank">RoJo</a> aggregator',
-'rssimagesbot','<a href="http://herbert.groot.jebbink.nl/?app=rssImages" title="Bot home page [new window]" target="_blank">rssImagesBot</a>',
-'ruffle','<a href="http://www.unreach.net/" title="Bot home page [new window]" target="_blank">ruffle SemanticWeb crawler</a>',
-'rufusbot','<a href="http://64.124.122.252.webaroo.com/feedback.html" title="Bot home page [new window]" target="_blank">RufusBot Rufus Web Miner</a>',
-'safeads\.xyz', '<a href="http://www.safeads.xyz/" rel="nofollow" title="SafeAds.xyz [new window]" target="_blank">SafeAds.xyz</a>',
-'safesearch',  '<a href="https://safesearch.avira.com" rel="nofollow" title="Avira SafeSearch Home Page [new window]" target="_blank">Avira SafeSearch</a>',
-'sandcrawler','<a href="http://www.microsoft.com/" title="Bot home page [new window]" target="_blank">SandCrawler (Microsoft)</a>',
-'savetheworldheritage', '<a href="http://savetheworldheritage.org" rel="nofollow" title="On March 4, 2015 a page parked at GoDaddy [new window]" target="_blank">savetheworldheritage.org (related to spiderlytics.com, waybackarchive.org and/or publiclibraryarchive.org?)</a>',
-'sbider','<a href="http://www.sitesell.com/sbider.html" title="Bot home page [new window]" target="_blank">SBIder</a>',
-'schizozilla','<a href="http://spamhuntress.com/2005/03/18/gizmo/ " title="Schizozilla home page [new window]" target="_blank">Schizozilla</a>',
-'scumbot','Scumbot',
-'searchguild[_+\s]dmoz[_+\s]experiment','<a href="http://www.searchguild.com/" title="SearchGuild_DMOZ_Experiment  home page [new window]" target="_blank">SearchGuild_DMOZ_Experiment</a>',
-'searchmetricsbot','<a href="http://www.searchmetrics.com/en/searchmetrics-bot/" rel="nofollow" title="SearchmetricsBot [new window]" target="_blank">SearchmetricsBot</a>',
-'seekbot','<a href="http://www.seekbot.net/bot.html" title="Bot home page [new window]">Seekbot</a>',
-'semrushbot', '<a href="http://www.semrush.com/bot.html" rel="nofollow" title="SemrushBot [new window]" target="_blank">SemrushBot</a>',
-'sensis_web_crawler','<a href="http://www.sensis.com.au/" title="Sensis Web Crawler home page [new window]" target="_blank">Sensis Web Crawler</a>',
-'seodiver', '<a href="http://www.seodiver.com/bot" rel="nofollow" title="SEO DIVER Bot Home Page [new window]" target="_blank">SEO DIVER</a>',
-'seokicks\.de', '<a href="http://www.seokicks.de/robot.html" rel="nofollow" title="SEOkicks Webcrawler home page [new window]" target="_blank">SEOkicks Webcrawler</a>',
-'seoscanners', '<a href="http://seoscanners.net" rel="nofollow" title="On August 4, 2015 a page parked at GoDaddy [new window]" target="_blank">seoscanners.net</a> (related to publiclibraryarchive.org and savetheworldheritage.org?)',
-'seznambot','<a href="http://fulltext.seznam.cz/" title="Bot home page [new window]" target="_blank">SeznamBot</a>',
-'shim\-crawler','<a href="http://www.logos.ic.i.u-tokyo.ac.jp/crawler/" title="crawl@logos.ic.i.u-tokyo.ac.jp Bot home page [new window]" target="_blank">Shim-Crawler</a>',
-'shoutcast','Shoutcast Directory Service',
-'sitedomain-bot', '<a href="http://www.sitedomain.de/sitedomain-bot/" rel="nofollow" title="Sitedomain-Bot Home Page [new window]" target="_blank">Sitedomain.de</a>',
-'siteexplorer\.info', '<a href="http://siteexplorer.info/" title="Site Explorer home page [new window]" target="_blank">Site Explorer</a>',
-'skimbot', '<a href="http://www.skimlinks.com" rel="nofollow" title="SkimBot [new window]" target="_blank">SkimBot</a>',
-'slysearch','SlySearch',
-'smtbot', '<a href="http://www.similartech.com/smtbot" rel="nofollow" title="SMTBot Home Page [new window]" target="_blank">SMTBot</a>',
-'snap\.com_beta_crawler','<a href="http://www.snap.com/" title="snap.com beta crawler home page [new window]" target="_blank">snap.com beta crawler</a>',
-'sohu\-search','<a href="http://corp.sohu.com/" title="Bot home page [new window]" target="_blank">sohu-search</a>',
-'sohu','<a href="http://corp.sohu.com/" title="Bot home page [new window]" target="_blank">sohu agent</a>',
-'snappy','<a href="http://www.urltrends.com/faq.php" title="Bot home page [new window]" target="_blank">Snappy</a>',
-'spbot', '<a href="http://www.seoprofiler.com/bot" rel="nofollow" title="SEOprofiler Bot [new window]" target="_blank">SEOprofiler Bot</a>',
-'sphere_scout','<a href="http://www.sphere.com/" title="Bot home page [new window]" target="_blank">Sphere Scout</a>',
-'spip','<a href="http://www.spip.net" title="SPIP home page [new window]" target="_blank">SPIP</a>',
-'sproose_crawler','<a href="http://www.sproose.com/bot.html" title="Bot home page [new window]" target="_blank">sproose crawler</a>',
-'ssearch_bot', '<a href="http://www.semantissimo.de/" title="sSearch Crawler [new window]" target="_blank">sSearch Crawler</a>',
-'steroid__download','<a href="http://faqs.org.ru/progr/pascal/delphi_internet2.htm" title="STEROID  Download home page [new window]" target="_blank">STEROID  Download</a>',
-'steeler','<a href="http://www.tkl.iis.u-tokyo.ac.jp/~crawler/ " title="Steeler home page [new window]" target="_blank">Steeler</a>',
-'stq_bot', '<a href="http://www.searchteq.de" rel="nofollow" title="SEARCHTEQ Home Page [new window]" target="_blank">SEARCHTEQ</a>',
-'suchfin\-bot','<a href="http://www.suchfin.de/" title="Suchfin-Bot home page [new window]" target="_blank">Suchfin-Bot</a>',
-'superbot','<a href="http://www.sparkleware.com/superbot/" title="SuperBot home page [new window]" target="_blank">SuperBot</a>',
-'surveybot','SurveyBot',
-'susie','<a href="http://www.sync2it.com/bms/susie.php" title="Susie home page [new window]" target="_blank">Susie</a>',
-'syndic8','Syndic8',
-'syndicapi','<a href="http://syndicapi.com/bot.html" title="Bot home page [new window]" target="_blank">SyndicAPI</a>',
-'synoobot','<a href="http://www.synoo.de/bot.html" title="webmaster@synoo.com SynooBot home page [new window]" target="_blank">SynooBot</a>',
-'tcl_http_client_package','<a href="http://www.tcl.tk/man/tcl8.4/TclCmd/http.htm" title="Tcl http client package home page [new window]" target="_blank">Tcl http client package</a>',
-'technoratibot', 'Technoratibot',
-'teragramcrawlersurf','<a href="http://www.teragram.com/" title="TeragramCrawlerSURF home page [new window]" target="_blank">TeragramCrawlerSURF</a>',
-'test_crawler','<a href="http://netp.ath.cx/" title="Test Crawler home page [new window]" target="_blank">Test Crawler</a>',
-'testbot','<a href="http://www.agbrain.com/" title="TestBot home page [new window]" target="_blank">TestBot</a>',
-'thumbsniper', '<a href="http://thumbsniper.com" rel="nofollow" title="ThumbSniper Home Page [new window]" target="_blank">ThumbSniper</a>',
-'t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e','<a href="http://www.thunderstone.com/" title="Bot home page. Used by many. [new window]" target="_blank">T-H-U-N-D-E-R-S-T-O-N-E</a>',
-'topicblogs', '<a href="http://www.topicblogs.com/" title="Bot home page [new window]" target="_blank">topicblogs</a>',
-'turnitinbot', '<a href="http://www.turnitin.com/robot/crawlerinfo.html" rel="nofollow" title="TurnitinBot Home Page [new window]" target="_blank">Turn It In</a>',
-'turtle', 'Turtle',
-'turtlescanner', 'Turtle',
-'tutorgigbot','<a href="http://www.tutorgig.info/" title="TutorGigBot home page [new window]" target="_blank">TutorGigBot</a>',
-'twiceler','<a href="http://www.cuill.com/twiceler/robot.html" title="Twiceler home page [new window]" target="_blank">twiceler</a>',
-'ubicrawler','<a href="http://law.dsi.unimi.it/ubicrawler/" title="Bot home page [new window]" target="_blank">UbiCrawler</a>',
-'ultraseek', 'Ultraseek',
-'unchaos_bot_hybrid_web_search_engine','<a href="http://www.unchaos.com/" title="UnChaos Bot Hybrid Web Search Engine home page [new window]" target="_blank">UnChaos Bot Hybrid Web Search Engine</a>',
-'unido\-bot','<a href="http://www.unchina.org/unido/unido/our_projects/3_3.html" title="unido-bot home page [new window]" target="_blank">unido-bot</a>',
-'unisterbot', 'UnisterBot; E-Mail only: crawler (at) unister.de',
-'updated','<a href="http://www.updated.com/" title="updated home page [new window]" target="_blank">updated</a>',
-'ustc\-semantic\-group','<a href="http://ai.ustc.edu.cn/mas/en/research/index.php" title="Bot home page [new window]" target="_blank">USTC-Semantic-Group</a>',
-'vagabondo\-wap','<a href="http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk" title="Bot home page [new window]" target="_blank">Vagabondo-WAP</a>',
-'vagabondo','<a href="http://www.wise-guys.nl/Contact/index.php?botselected=webagents&amp;lang=uk" title="Bot home page [new window]" target="_blank">Vagabondo</a>',
-'vebidoobot', '<span title="As on Oct. 27, 2015, the user agent string did not contain a web address.">vebidoobot</span>',
-'vermut','<a href="http://vermut.aol.com/" title="Bot home page [new window]" target="_blank">Vermut</a>',
-'versus_crawler_from_eda\.baykan@epfl\.ch','<a href="http://www.epfl.ch/Eindex.html  " title="versus crawler from eda.baykan@epfl.ch home page [new window]" target="_blank">versus crawler from eda.baykan@epfl.ch</a>',
-'vespa_crawler','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=%5Cbid_t_z_030406_1%5Cb" title="Bot home page [new window]" target="_blank">Vespa Crawler</a>',
-'voltron', '<span title="As on Oct. 21, 2015, the user agent string did not contain a web address.">voltron</span>',
-'vortex','<a href="http://marty.anstey.ca/projects/robots/vortex/" title="Bot home page [new window]" target="_blank">VORTEX</a>',
-'vse\/','<a href="http://www.vivisimo.com/" title="VSE home page [new window]" target="_blank">VSE</a>',
-'w3c\-checklink','<a href="http://validator.w3.org/checklink/" title="Bot home page [new window]" target="_blank">W3C Link Checker</a>',
-'w3c[_+\s]css[_+\s]validator[_+\s]jfouffa', '<a href="http://jigsaw.w3.org/css-validator/" title="Bot home page [new window]" target="_blank">W3C jigsaw CSS Validator</a>',
-'w3c_validator','<a href="http://validator.w3.org/" title="Bot home page [new window]" target="_blank">W3C Validator</a>',
-'watchmouse', '<a href="http://www.watchmouse.com/en/" title="WatcMouse">WatchMouse Website Monitor</a>',
-'wavefire','<a href="http://www.wavefire.com" title="info@wavefire.com; Bot home page [new window]" target="_blank">Wavefire</a>',
-'waybackarchive\.org', '<span title="Maybe related to spiderlytics.">No website, email: spider(at)waybackarchive.org</span>',
-# 2.12.2013 Project Honeypot reports at least one of the IPs used by waybackarchive with a spiderlytics UA string.
-# Problably not related to the wayback machine of archive.org.
-'wbsearchbot', '<a href="http://www.warebay.com/bot.html" rel="nofollow" title="WBSearchBot [new window]" target="_blank">WBSearchBot</a>',
-'webclipping\.com', 'WebClipping.com',
-'webcompass', 'webcompass',
-'webcrawl\.net','<a href="http://www.webcrawl.net/" title="webcrawl.net home page [new window]" target="_blank">webcrawl.net</a>',
-'web_downloader','<a href="http://www.krasu.ru/soft/chuchelo/" title="Web Downloader home page [new window]" target="_blank">Web Downloader</a>',
-'webdup','<a href="http://www.webdup.com/en/index.html" title="Webdup home page [new window]" target="_blank">Webdup</a>',
-'webfilter','<a href="http://www.verso.com/enterprise/netspective/webfilter.asp" title="Bot home page [new window]" target="_blank">WebFilter</a>',
-'webindexer','<a href="mailto://webindexerv1@yahoo.com" title="WebIndexer home page [new window]" target="_blank">WebIndexer</a>',
-'webminer','<a href="http://64.124.122.252/feedback.html" title="WebMiner home page [new window]" target="_blank">WebMiner</a>',
-'website[_+\s]monitoring[_+\s]bot','<a href="http://InternetSupervision.com/UrlMonitor/3/" title="Website_Monitoring_Bot home page [new window]" target="_blank">Website_Monitoring_Bot</a>',
-'webvulncrawl', 'WebVulnCrawl',
-'wells_search','<a href="http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&amp;template=detail.html&amp;match=\bid_t_z_1484\b " title="Wells Search home page [new window]" target="_blank">Wells Search</a>',
-'wer-liefert-was', '<a href="http://www.wlw.de/extern/crawler/Wer-liefert-was-Crawler.html" rel="nofollow" title="Page given in UA string gave a 404 Error on July 2, 2015 [new window]" target="_blank">Wer-liefert-was Crawler</a> Note: AWStats counts most traffic as user traffic',
-'wesee:search', '<a href="http://www.wesee.com/en/support/bot/" title="WeSEE Bot Home Page (gave a 404-Error on Nov. 2, 2013) [new window]" target="_blank">WeSEE Bot</a>',
-'wevikabot', '<a href="http://www.wevika.de/" rel="nofollow" title="WeViKa Home Page [new window]" target="_blank">WeViKa</a>',
-'wonderer', 'Web Wombat Redback Spider',
-'wotbox', '<a href="http://www.wotbox.com/bot/" rel="nofollow" title="Wotbox Bot Home Page [new window]" target="_blank">Wotbox</a>',
-'wume_crawler','<a href="http://wume.cse.lehigh.edu/~xiq204/crawler/ " title="wume crawler home page [new window]" target="_blank">wume crawler</a>',
-'wwweasel',,'<a href="http://wwweasel.de/" title="Website_Monitoring_Bot home page [new window]" target="_blank">WWWeasel</a>',
-'xenu\'s_link_sleuth','<a href="http://home.snafu.de/tilman/xenulink.html" title="Xenu Link Sleuth home page [new window]" target="_blank">Xenu Link Sleuth</a>',
-'xenu_link_sleuth','<a href="http://home.snafu.de/tilman/xenulink.html" title="Xenu Link Sleuth home page [new window]" target="_blank">Xenu Link Sleuth</a>',
-'xirq','<a href="http://www.xirq.com/" title="xirq home page [new window]" target="_blank">xirq</a>',
-'xovibot', '<a href="http://www.xovibot.net/" rel="nofollow" title="XoviBot Home Page [new window]" target="_blank">XoviBot</a>',
-'y!j', '<a href="http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html" title="Bot home page [new window]" target="_blank">Y!J Yahoo Japan</a>',
-'yacy', '<a href="http://yacy.net/bot.html" rel="nofollow" title="YaCy Home Page [new window]" target="_blank">YaCy</a>',
-'yahoo\-blogs','<a href="http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html" title="Bot home page [new window]" target="_blank">Yahoo-Blogs</a>',
-'yahoo\-verticalcrawler', 'Yahoo Vertical Crawler',
-'yahoofeedseeker', '<a href="http://publisher.yahoo.com/rssguide" title="Bot home page [new window]" target="_blank">Yahoo Feed Seeker</a>',
-'yahooseeker\-testing', '<a href="http://search.yahoo.com/" title="Bot home page [new window]" target="_blank">YahooSeeker-Testing</a>',
-'yahooseeker', '<a href="http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html" title="Bot home page [new window]" target="_blank">YahooSeeker Yahoo! Blog crawler</a>',
-'yahoo\-mmcrawler', '<a href="mailto:mms-mmcrawler-support@yahoo-inc.com?subject=Yahoo-MMCrawler Information" title="E-mail Bot">Yahoo-MMCrawler</a>',
-'yahoo!_mindset','<a href="http://mindset.research.yahoo.com/" title="Bot home page [new window]">Yahoo! Mindset</a>',
-'yandex', '<a href="http://yandex.com/bots" title="Bot home page [new window]">Yandex Bot</a>',
-'flexum', 'Flexum Search Engine',
-'yanga', 'Yanga WorldSearch Bot',
-'yet-another-spider','<a href="http://188.40.112.195/" title="Yet-Another-Spider home page [new window]" target="_blank">Yet-Another-Spider</a>',
-'yisouspider', 'YisouSpider (no additional information in UA string)',
-'yooglifetchagent','<a href="http://www.yoogli.com/" title="yoogliFetchAgent home page [new window]" target="_blank">yoogliFetchAgent</a>',
-'z\-add_link_checker','<a href="http://w3.z-add.co.uk/linkcheck/" title="Z-Add Link Checker home page [new window]" target="_blank">Z-Add Link Checker</a>',
-'zealbot','ZealBot',
-'zhuaxia','<a href="http://www.zhuaxia.com/"  target="_blank">ZhuaXia</a>',
-'zspider','<a href="http://feedback.redkolibri.com/" title="Bot home page [new window]" target="_blank">zspider</a>',
-'zeus','<a href="http://www.webmasterworld.com/forum11/1840.htm" title="Bot documentation [new window]" target="_blank">Zeus Webster Pro</a>',
-'zumbot','<a href="http://help.zum.com/inquiry" title="ZumBot home page [new window]" target="_blank">ZumBot</a>',
-'ng\/1\.','<a href="http://www.exabot.com/" title="Bot home page [new window]" target="_blank">NG 1.x (Exalead)</a>', # put at end to avoid false positive
-'ng\/2\.','<a href="http://www.exabot.com/" title="Bot home page [new window]" target="_blank">NG 2.x (Exalead)</a>', # put at end to avoid false positive
-'exabot','<a href="http://www.exabot.com/" title="Bot home page [new window]" target="_blank">Exabot</a>', # put at end to avoid false positive
-# Other id that are 99% of robots
-'wget','WGet tools',
-'libwww','Perl tool',
-'^java\/[0-9]','<a href="http://www.projecthoneypot.org/harvester_useragents.php" title="Bot home page [new window]" target="_blank">Java (Often spam bot)</a>', # put at end to avoid false positive
-# Generic robot
-'robot', 'Unknown robot (identified by \'robot\')',
-'checker', 'Unknown robot (identified by \'checker\')',
-'crawl', 'Unknown robot (identified by \'crawl\')',
-'discovery', 'Unknown robot (identified by \'discovery\')',
-'hunter', 'Unknown robot (identified by \'hunter\')',
-'scanner', 'Unknown robot (identified by \'scanner\')',
-'spider', 'Unknown robot (identified by \'spider\')',
-'sucker', 'Unknown robot (identified by \'sucker\')',
-'bot[\s_+:,\.\;\/\\\-]', 'Unknown robot (identified by \'bot\' followed by a space or one of the following characters _+:,.;/\-)',
-'[\s_+:,\.\;\/\\\-]bot', 'Unknown robot (identified by a space or one of the characters _+:,.;/\- followed by \'bot\')',
-'curl', 'Common *nix tool for automating web document retrieval. Most likely a bot.',
-'php', 'A PHP script',
-'ruby\/', 'Ruby script',
-# Additional bots found by Sussex.
-'^[1-3]$', 'Generic bot identified as "1", "2" or "3"',
-'alltop', 'alltop',
-'applesyndication', 'applesyndication',
-'asynchttpclient', 'asynchttpclient',
-'bingbot', '<a href="http://www.bing.com/bingbot.htm" title="Bing home page [new window]" target="_blank">Bingbot</a>',
-'blogged_crawl', 'blogged_crawl',
-'bloglovin', 'bloglovin',
-'butterfly', 'butterfly',
-'buzztracker', 'buzztracker',
-'carpathia', 'carpathia',
-'catbot', 'catbot',
-'chattertrap', 'chattertrap',
-'check_http', 'check_http (nagios)',
-'coldfusion', 'coldfusion',
-'covario', 'covario',
-'daylifefeedfetcher', 'daylifefeedfetcher',
-'discobot', 'discobot',
-'dlvr\.it', 'dlvr.it',
-'dreamwidth', 'dreamwidth',
-'drupal', 'Drupal Site',
-'ezoom', 'ezoom',
-'feedmyinbox', 'feedmyinbox',
-'feedroll\.com', 'feedroll.com',
-'feedzira', 'feedzira',
-'fever\/', '<a href="http://feedafever.com">Feed a Fever</a>',
-'freenews', 'freenews',
-'geohasher', 'geohasher',
-'hanrss', 'hanrss',
-'inagist', 'inagist',
-'jacobin\sclub', 'jacobin club',
-'jakarta', 'jakarta',
-'js\-kit', 'js-kit',
-'largesmall\scrawler', 'largesmall crawler',
-'linkedinbot', 'linkedinbot',
-'longurl', 'longurl',
-'metauri', 'metauri',
-'microsoft\-webdav\-miniredir', 'microsoft-webdav-miniredir',
-'^motorola$', 'Suspected Bot masquerading as "Motorola"',
-'movabletype', 'movabletype',
-'^mozilla\/3\.0\s\(compatible$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/4\.0$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/4\.0\s\(compatible;\)$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/5\.0$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/5\.0\s\(compatible;$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/5\.0\s\(en\-us\)$', 'Suspected bot masqurading as Mozilla',
-'^mozilla\/5\.0\sfirefox\/3\.0\.5$', 'Suspected bot masqurading as Mozilla',
-'^msie', 'Suspected bot masquerading as M$ IE',
-'netnewswire', 'netnewswire',
-'\snetseer\s', '<a href="http://www.netseer.com/crawler.html">Net Seer</a>',
-'netvibes', 'netvibes',
-'newrelicpinger', 'newrelicpinger',
-'newsfox', 'Fox News',
-'nextgensearchbot', 'nextgensearchbot',
-'ning', 'ning',
-'pingdom', 'pingdom',
-'pita', 'pita (pain in the ass?)',
-'postpost', 'postpost',
-'postrank', 'postrank',
-'printfulbot', 'printfulbot',
-'protopage', 'protopage',
-'proximic', '<a href="http://www.proximic.com/info/spider.php" title="Proximic Spider home page [new window]" target="_blank">Proximic Spider</a>',
-'quipply', 'quipply',
-'r6\_', '<a href="http://www.radian6.com/crawler">Radian 6 Crawler</a>',
-'ratingburner', 'ratingburner',
-'regator', 'regator',
-'rome\sclient', 'rome client',
-'rpt\-httpclient', 'rpt-httpclient',
-'rssgraffiti', 'rssgraffiti',
-'sage\+\+', 'sage++',
-'scoutjet', '<a href="http://wwww.scoutjet.com/" target="_blank">ScoutJet</a> crawler for <a href="http://blekko.com/" target="_blank">Blekko</a>.',
-'simplepie', 'simplepie',
-'sitebot', 'sitebot',
-'summify\.com', '<a href="http://summify.com/">summify.com</a>',
-'superfeedr', 'superfeedr',
-'synthesio', 'synthesio',
-'teoma', 'teoma',
-'topblogsinfo', 'topblogsinfo',
-'topix\.net', 'topix.net',
-'trapit', 'trapit',
-'trileet', 'trileet',
-'tweetedtimes', '<a href="http://tweetedtimes.com">The Tweeted Times</a>',
-'twisted\spagegetter', 'twisted pagegetter',
-'twitterbot', '<span title="As on Nov. 27, 2015, the user agent string did not contain a web address.">Twitterbot</span>',
-'twitterfeed', 'twitterfeed',
-'unwindfetchor', 'unwindfetchor',
-'wazzup', 'wazzup',
-'windows\-rss\-platform', 'windows-rss-platform',
-'wiumi', 'wiumi',
-'xydo', 'xydo',
-'yahoo!\sslurp', 'Additional Yahoo bots.',
-'yahoo\spipes', 'Additional Yahoo bots.',
-'yahoo\-newscrawler', 'Additional Yahoo bots.',
-'yahoocachesystem', 'Additional Yahoo bots.',
-'yahooexternalcache', 'Additional Yahoo bots.',
-'yahoo!\ssearchmonkey', 'Additional Yahoo bots.',
-'yahooysmcm', 'Additional Yahoo bots.',
-'yammer', 'yammer',
-#'yandexbot', 'yandexbot', #already covered by 'yandex'
-'yeti', 'yeti',
-'yie8', 'yie8',
-'youdao', 'youdao',
-'yourls', 'yourls',
-'zemanta', 'zemanta',
-'zend_http_client', 'Zend Http Client',
-'no_user_agent','Unknown robot (identified by empty user agent string)',
-# Unknown robots identified by hit on robots.txt
-'unknown', 'Unknown robot (identified by hit on \'robots.txt\')'
-);
-
-
-# RobotsAffiliateLib
-# This list tries to tell by which search engine (or company) a robot is used.
-# Each entry maps a robot ID to the name of its operator.
-#
-# The robot ID must be spelled exactly like the key of the same robot in
-# RobotsHashIDLib, including backslash escapes: inside single quotes Perl
-# keeps the backslash of '\-', so 'yahoo\-newscrawler' and
-# 'yahoo-newscrawler' are two different hash keys and a lookup by robot ID
-# only succeeds on an exact string match.
-#-------------------------------------------------------------
-%RobotsAffiliateLib = (
-'bingpreview'=>'Bing',
-'fast\-webcrawler'=>'AllTheWeb',
-'googlebot'=>'Google',
-'google\-sitemap'=>'Google',
-'google[_+\s]web[_+\s]preview'=>'Google',
-'msnbot'=>'MSN',
-'nutch'=>'Looksmart',
-'scooter'=>'AltaVista',
-'wisenutbot'=>'Looksmart',
-'yahoo\-blogs'=>'Yahoo',
-'yahoo\-verticalcrawler'=>'Yahoo',
-'yahoofeedseeker'=>'Yahoo',
-'yahooseeker\-testing'=>'Yahoo',
-'yahooseeker'=>'Yahoo',
-'yahoo\-mmcrawler'=>'Yahoo',
-'yahoo!_mindset'=>'Yahoo',
-'zyborg'=>'Looksmart',
-'cfetch'=>'Kosmix',
-'^voyager\/'=>'Kosmix',
-# Additional bots found by Sussex.
-'feedfetcher\-google'=>'Google',
-'bingbot'=>'MSN',
-'twitterbot'=>'Twitter',
-'twitterfeed'=>'Twitter',
-'yahoo!\sslurp'=>'Yahoo',
-'yahoo\spipes'=>'Yahoo',
-# Key escaped to match the 'yahoo\-newscrawler' ID used in RobotsHashIDLib.
-'yahoo\-newscrawler'=>'Yahoo',
-'yahoocachesystem'=>'Yahoo',
-'yahooexternalcache'=>'Yahoo',
-'yahoo!\ssearchmonkey'=>'Yahoo',
-'yahooysmcm'=>'Yahoo'
-);
-
-1;
+# AWSTATS ROBOTS DATABASE\r
+#-------------------------------------------------------\r
+# If you want to add robots to extend AWStats database detection capabilities,\r
+# you must add an entry in RobotsSearchIDOrder_listx and RobotsHashIDLib.\r
+\r
+# The entry in RobotsSearchIDOrder_listx is a Perl regular expression\r
+# (see http://perldoc.perl.org/perlreref.html). AWStats applies these\r
+# expressions to the user agent string in the order given by the lists. The\r
+# first match specifies the robot.\r
+#\r
+# Note: This regular expression must not contain any whitespace.\r
+# Otherwise AWStats will produce lines in the database that\r
+# will be misinterpreted and as a consequence the corresponding data in the\r
+# generated HTML reports will be wrong. If you want to match whitespace in\r
+# the user agent string, use other constructs like '\s', '[:blank:]',\r
+# '\p{IsSpace}', '\x20' etc.\r
+#\r
+# The corresponding entry in RobotsHashIDLib contains the regular expression\r
+# as key, followed by a string containing HTML-text. AWStats inserts this\r
+# text into reports to describe the bot. If possible the text should contain\r
+# a link to the bot home page. This makes it easier for sysadmins to find\r
+# the information necessary e.g. to adapt the robots.txt file.\r
+#\r
+# An entry in the RobotsAffiliateLib is not necessary. An entry in this list\r
+# contains as first part the regular expression specifying the bot. The\r
+# second part is a string that gives the Company or product managing the bot.\r
+# This information is not used yet.\r
+#\r
+# There are several sorts of bots that AWStats is not able to detect and\r
+# therefore a considerable amount of bot generated traffic counts\r
+# as user traffic:\r
+#\r
+# a) A crawler that identifies itself in the referrer string, but not in\r
+#    the user agent string. An example is the crawler from semalt.semalt.com.\r
+#\r
+# b) Crawlers that correctly access robots.txt but identify themselves in\r
+#    the user agent string only once or just a few times. Most of the\r
+#    time a user agent string is used that does not contain hints that\r
+#    a bot is involved. An example is the iCjobs spider.\r
+#    msnbot-UDiscovery/2.0b seems to show this behaviour too.\r
+#\r
+#\r
+#\r
+#-------------------------------------------------------\r
+\r
+# 2016-09-02 RobC \r
+#              Fixed a few errors and added a few missing bots from awstats 7.5 release.\r
+#\r
+# 2016-08-28 RobC \r
+#              Complete re-build of this file almost from scratch.\r
+#              dropped many old bots, added many new bots and reordered file.\r
+#              edited and added regex expressions to stop spaces causing problems.\r
+#              You should tune file by placing the most common robots crawling your site at top \r
+#              in List1.\r
+#\r
+#\r
+#              N.B. many bots need to be in the correct order, so don't change the order without checking whether\r
+#              the change will cause counts to be allocated to the wrong bot. This is not always simple.\r
+#\r
+#\r
+# 2005-08-19 Sean Carlos http://www.antezeta.com/awstats.html\r
+#              added dipsie (not tested with real data).\r
+#              added DomainsDB.net http://domainsdb.net/\r
+#              added ia_archiver-web.archive.org (was inadvertently grouped with Alexa traffic)\r
+#              added Nutch (used by looksmart (furl?))\r
+#              added rssImagesBot\r
+#              added Sqworm\r
+#              added t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e\r
+#              added w3c css-validator\r
+#              added documentation link to bot home pages for above and selected major bots.\r
+#                    In the case of international bots, choose .com page.\r
+#                    Included tool tip (html "title").\r
+#                    To do: parameterize to match both AWStats language and tooltips settings.\r
+#                    To do: add html links for all bots based on current documentation in source\r
+#                           files referenced below.\r
+#              changed '\wbot[\/\-]', to '\wbot[\/\-]' (removed comma)\r
+#              made minor grammar corrections to notes below\r
+# 2005-08-24   added YahooSeeker-Testing\r
+#                      added w3c-checklink\r
+#                      updated url for ask.com\r
+# 2005-08-24           added Girafabot http://www.girafa.com/\r
+# 2005-08-30           added PluckFeedCrawler http://www.pluck.com/\r
+#              added Gaisbot/3.0 (robot05@gais.cs.ccu.edu.tw; )\r
+#              added geniebot (wgao@genieknows.com)\r
+#              added BecomeBot link http://www.become.com/site_owners.html\r
+#              added topicblogs http://www.topicblogs.com/\r
+#              added Powermarks; seen used by referrer spam\r
+#              added YahooSeeker\r
+#              added NG/2. http://www.exabot.com/\r
+# 2005-09-15   added link for Walhello appie\r
+#              added bender focused_crawler\r
+#              updated YahooSeeker description (blog crawler)\r
+# 2005-09-16   added link for http://linkchecker.sourceforge.net\r
+#              added ConveraCrawler/0.9d ( http://www.authoritativeweb.com/crawl)\r
+#              added Blogslive  info@blogslive.com intelliseek.com\r
+#              added BlogPulse (ISSpider-3.0) intelliseek.com\r
+# 2005-09-26   added Feedfetcher-Google (http://www.google.com/feedfetcher.html)\r
+#              added EverbeeCrawler\r
+#              added Yahoo-Blogs http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html\r
+#              added link for Bloglines http://www.bloglines.com\r
+# 2005-10-19   fixed Feedfetcher-Google (http://www.google.com/feedfetcher.html)\r
+#              added Blogshares Spiders (Synchronized V1.5.1)\r
+#              added yacy\r
+# 2005-11-21   added Argus www.simpy.com\r
+#              added BlogsSay :: RSS Search Crawler (http://www.blogssay.com/)\r
+#              added MJ12bot http://majestic12.co.uk/bot.php\r
+#              added OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm)\r
+#              added OutfoxBot/0.3 (For internet experiments; outfox.agent@gmail.com)\r
+#              added RufusBot Rufus Web Miner http://64.124.122.252.webaroo.com/feedback.html\r
+#              added Seekbot (http://www.seekbot.net/bot.html)\r
+#              added Yahoo-MMCrawler/3.x (mms-mmcrawler-support@yahoo-inc.com)\r
+#               added link for BaiDuSpider\r
+#              added link for Blogshares Spider\r
+#              added link for StackRambler http://www.rambler.ru/doc/faq.shtml\r
+#              added link for WISENutbot\r
+#              added link for ZyBorg/1.0 (wn-14.zyborg@looksmart.net; http://www.WISEnutbot.com).  Moved location to above wisenut to avoid classification as wisenut\r
+# 2005-12-15\r
+#              added FAST Enteprise Crawler/6 (www dot fastsearch dot com). Note spelling Enteprise not Enterprise.\r
+#              added findlinks http://wortschatz.uni-leipzig.de/findlinks/\r
+#              added IBM Almaden Research Center WebFountain(TM) http://www.almaden.ibm.com/cs/crawler [hc3]\r
+#              added INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents)\r
+#              added lmspider (lmspider@scansoft.com) http://www.nuance.com/\r
+#              added noxtrumbot http://www.noxtrum.com/\r
+#              added SandCrawler (Microsoft)\r
+#              added SBIder http://www.sitesell.com/sbider.html\r
+#              added SeznamBot http://fulltext.seznam.cz/\r
+#              added sohu-search http://corp.sohu.com/ (looked for //robots.txt not /robots.txt)\r
+#              added the ruffle SemanticWeb crawler v0.5 - http://www.unreach.net\r
+#              added WebVulnCrawl/1.0 libwww-perl/5.803 (looked for //robots.txt not /robots.txt)\r
+#              added Yahoo! Japan keyoshid http://www.yahoo.co.jp/\r
+#              added Y!J http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html\r
+#              added link for GigaBot\r
+#              added link for MagpieRSS\r
+#              added link for MSIECrawler\r
+# 2005-12-21\r
+#              added aipbot http://www.aipbot.com aipbot@aipbot.com [matthys70 users.sourceforge.net]\r
+#              added Everest-Vulcan Inc./0.1 (R&D project; http://everest.vulcan.com/crawlerhelp)\r
+#              added Fast-Search-Engine http://www.fast-search-engine.com/ [matthys70  users.sourceforge.net]\r
+#              added g2Crawler (nobody@airmail.net) http://crawler.instantnetworks.net/\r
+#              added Jakarta commons-httpclient http://jakarta.apache.org/commons/httpclient/ (hit robots.txt).  May be used as robot or browser - a site may want to remove this entry.\r
+#              added OmniExplorer_Bot http://www.omni-explorer.com/ [matthys70 users.sourceforge.net]\r
+#              added USTC-Semantic-Group ai.ustc.edu.cn/mas/en/research/index.php ?\r
+# 2005-12-22\r
+#              added EARTHCOM.info www.earthcom.info\r
+#              added HTTrack off-line browser 'httrack','HTTrack', http://www.httrack.com/ [Moizes Gabor]\r
+#              added KummHttp http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_g_l_301105_2\b [Moizes Gabor]\r
+# 2006-01-01\r
+#              added Dulance http://www.dulance.com/bot.jsp\r
+#              added MojeekBot http://www.mojeek.com/bot.html\r
+#              added nicebot http://www.egghelp.org/setup.htm ?\r
+#              added Snappy http://www.urltrends.com/faq.php\r
+#              added sohu agent\r
+#              added VORTEX http://marty.anstey.ca/robots/vortex/ [matthys70 users.sourceforge.net]\r
+#              added zspider http://feedback.redkolibri.com/\r
+# 2006-01-13\r
+#              added boitho.com-dc http://www.boitho.com/dcbot.html\r
+#              added IRLbot http://irl.cs.tamu.edu/crawler\r
+#              added virus_detector virus_harvester@securecomputing.com\r
+#              added Wavefire http://www.wavefire.com; info@wavefire.com\r
+\r
+#              added WebFilter Robot\r
+# 2006-01-24\r
+#              added Shim-Crawler http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp\r
+#              added Exabot exabot.com\r
+#              added LetsCrawl.com http://letscrawl.com\r
+#              added ichiro http://help.goo.ne.jp/door/crawlerE.html\r
+# 2006-01-27    additional 22 robots from a list provided by Moizes Gabor\r
+#              added ALeadSoftbot      http://www.aleadsoft.com/bot.htm\r
+#              added CipinetBot        http://www.cipinet.com/bot.html\r
+#              added Cuasarbot http://www.cuasar.com/\r
+#              added Dumbot    http://www.dumbfind.com/\r
+#              added Extreme_Picture_Finder    http://www.exisoftware.com/\r
+#              added Fooky.com/ScorpionBot/ScoutOut    http://www.fooky.com/scorpionbots\r
+#              added IlTrovatore-Setaccio      http://www.iltrovatore.it/aiuto/motore_di_ricerca.html  bot@iltrovatore.it\r
+#              added InsurancoBot      http://www.fastspywareremoval.com/\r
+#              added InternetArchive   http://lucene.apache.org/nutch/bot.html         nutch-agent@lucene.apache.org\r
+#              added KazoomBot http://www.kazoom.ca/bot.html   kazoombot@kazoom.ca\r
+#              added Kurzor    http://www.easymail.hu/ cursor@easymail.hu\r
+#              added NutchCVS  http://lucene.apache.org/nutch/bot.html nutch-agent@lucene.apache.org\r
+#              added NutchOSU-VLIB     http://lucene.apache.org/nutch/bot.html nutch-agent@lucene.apache.org\r
+#              added Orbiter   http://www.dailyorbit.com/bot.htm\r
+#              added PHP_version_tracker       http://www.nexen.net/phpversion/bot.php\r
+#              added SuperBot  http://www.sparkleware.com/superbot/\r
+#              added SynooBot  http://www.synoo.de/bot.html    webmaster@synoo.com\r
+#              added TestBot   http://www.agbrain.com/\r
+#              added TutorGigBot       http://www.tutorgig.info/\r
+#              added WebIndexer        mailto://webindexerv1@yahoo.com\r
+#              added WebMiner  http://64.124.122.252/feedback.html\r
+# 2006-02-01\r
+#              added heritrix https://sourceforge.net/forum/message.php?msg_id=3550202\r
+#              added Zeus Webster Pro https://sourceforge.net/forum/message.php?msg_id=3141164\r
+#               additional robots from a list provided by Moizes Gabor [ mojzi -a-t- free mail hu ]\r
+#              added Candlelight_Favorites_Inspector\r
+#              added DomainChecker\r
+#              added EasyDL\r
+#              added FavOrg\r
+#              added Favorites_Sweeper\r
+#              added Html_Link_Validator\r
+#              added Internet_Ninja\r
+#              added JRTwine_Software_Check_Favorites_Utility\r
+#              fixed Microsoft_URL_Control\r
+#              added miniRank\r
+#              added Missigua_Locator\r
+#              added NPBot\r
+#              added Ocelli\r
+#              added Onet.pl_SA\r
+#              added proodleBot\r
+#              added SearchGuild_DMOZ_Experiment\r
+#              added Susie\r
+#              added Website_Monitoring_Bot\r
+#              added Xenu_Link_Sleuth\r
+# 2006-05-15\r
+#              added ASPseek http://www.aspseek.org/\r
+#              added AdamM Bot http://home.blic.net/adamm/\r
+#              added archive.org_bot http://crawls.archive.org/collections/bncf/crawl.html\r
+#              added arianna.libero.it (Italian Portal/search engine)\r
+#              added Biz360 spider http://www.biz360.com\r
+#              added BlogBridge Service http://www.blogbridge.com/\r
+#              added BlogSearch http://www.icerocket.com/\r
+#              added libcrawl\r
+#              added edgeio-retriever http://www.edgeio.com\r
+#              added FeedFlow http://feedflow.com/about\r
+#              added Biblioteca Nazionale Centrale di Firenze (Italian National Archive) http://www.bncf.firenze.sbn.it/raccolta.txt\r
+#              added Java catchall - used by many spam bots\r
+#              added lanshanbot http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=%5Cbid_g_l_140406_1%5Cb\r
+#              added msnbot-media http://search.msn.com/msnbot.htm\r
+#              added MT::Telegraph::Agent\r
+#              added Netluchs http://www.netluchs.de/ (German SE bot)\r
+#              added oBot http://www.webmasterworld.com/forum11/1616.htm\r
+#              added Onfolio http://www.onfolio.com/  (IE Toolbar plugin) - hit rss feeds.\r
+#              added ping.blo.gs http://blo.gs/ping.php blog bot\r
+#              added Sphere Scout http://www.sphere.com/\r
+#              added sproose crawler http://www.sproose.com/bot.html\r
+#              added SyndicAPI http://syndicapi.com/bot.html\r
+#              added Yahoo! Mindset http://mindset.research.yahoo.com/\r
+#              added msrabot\r
+#              added Vagabondo & Vagabondo-WAP http://www.wise-guys.nl/Contact/index.php?botselected=webagents)#=uk\r
+#              fixed Missigua Locator detection (Missigua_Locator -> Missigua Locator)\r
+#              changed echo to echo! to avoid conflict with the bonecho (Firefox 2.0) browser.\r
+#                      This requires you to reprocess historic logs if you want EchO! to be recognized for older reports.\r
+# 2006-05-17\r
+#              added Alpha Search Agent # 62.152.125.60 Eurologon Srl\r
+#              added Krugle http://www.krugle.com/crawler/info.html the search engine for developers\r
+#              added Octora Beta Bot http://www.octora.com/ # Blog and Rss Search Engine\r
+#              added UbiCrawler http://law.dsi.unimi.it/ubicrawler/\r
+#              added Yahoo! Slurp China http://misc.yahoo.com.cn/help.html\r
+#                      You must reprocess old logs for the Yahoo! Slurp China bot to be detected in old reports\r
+# 2006-05-20\r
+#              added 1-More Scanner http://www.myzips.com/software/1-More-Scanner.phtml\r
+#              added Accoona-AI-Agent http://www.accoona.com/\r
+#              added ActiveBookmark http://www.libmaster.com/active_bookmark.php\r
+#              added BIGLOTRON http://www.biglotron.com/robot.html\r
+#              added Bookmark-Manager http://bkm.sourceforge.net/\r
+#              added cbn00glebot\r
+#              added Cerberian Drtrs http://www.pgts.com.au/cgi-bin/psql?robot_info=25240\r
+#              added CFNetwork http://www.cocoadev.com/index.pl?CFNetwork\r
+#              added CheckWeb link validator http://p.duby.free.fr/chkweb.htm\r
+#              added Computer and Automation Research Institute Crawler http://www.ilab.sztaki.hu/~stamas/publications/p184-benczur.html\r
+#              added ConveraCrawler http://www.authoritativeweb.com/crawl/\r
+#              added ConveraMultiMediaCrawler http://www.authoritativeweb.com/crawl/\r
+#              added CSE HTML Validator Lite Online http://online.htmlvalidator.com/php/onlinevallite.php\r
+#              added Cursor http://adcenter.hu/docs/en/bot.html\r
+#              added Custo http://www.netwu.com/custo/\r
+#              added DataFountains/DMOZ Downloader http://infomine.ucr.edu/\r
+#              added Deepindex http://www.deepindex.net/faq.php\r
+#              added DNSGroup http://www.dnsgroup.com/\r
+#              added DoCoMo http://www.nttdocomo.co.jp/\r
+#              added dumm.de-Bot http://www.dumm.de/\r
+#              added ETS v http://www.freetranslation.com/help/\r
+#              added eventax http://www.eventax.de/\r
+#              added FAST Enterprise Crawler * crawleradmin.t-info@telekom.de http://www.telekom.de/\r
+#              added FAST Enterprise Crawler http://www.fast.no/\r
+#              added FAST Enterprise Crawler * T-Info_BI_cluster crawleradmin.t-info@telekom.de http://www.telekom.de/\r
+#              added FeedValidator http://feedvalidator.org/\r
+#              added FilmkameraBot http://www.filmkamera.at/bot.html\r
+#              added Findexa Crawler http://www.findexa.no/gulesider/article26548.ece\r
+#              added Global Fetch http://www.wesonet.com/\r
+#              added GOFORITBOT http://www.goforit.com/about/\r
+#              added GoForIt.com http://www.goforit.com/about/\r
+#              added GPU p2p crawler http://gpu.sourceforge.net/search_engine.php\r
+#              added HooWWWer http://cosco.hiit.fi/search/hoowwwer/\r
+#              added HPPrint\r
+#              added HTMLParser http://htmlparser.sourceforge.net/\r
+#              added Hundesuche.com-Bot http://www.hundesuche.com/\r
+#              added InfoBot http://www.infobot.org/\r
+#              added InfociousBot http://corp.infocious.com/tech_crawler.php\r
+#              added InternetSupervision http://internetsupervision.com/\r
+#              added isearch2006 http://www.yahoo.com.cn/\r
+#              added IUPUI_Research_Bot http://spamhuntress.com/2005/04/25/a-mail-harvester-visits/\r
+#              added KalamBot http://64.124.122.251/feedback.html\r
+#              added kamano.de NewsFeedVerzeichnis http://www.kamano.de/\r
+#              added Kevin http://dznet.com/kevin/\r
+#              added KnowItAll http://www.cs.washington.edu/research/knowitall/\r
+#              added Knowledge.com http://www.knowledge.com/\r
+#              added Kouaa Krawler http://www.kouaa.com/\r
+#              added ksibot http://ego.ms.mff.cuni.cz/\r
+#              added Link Valet Online http://www.htmlhelp.com/tools/valet/\r
+#              added lwp-request http://search.cpan.org/~gaas/libwww-perl-5.69/bin/lwp-request\r
+#              added lwp-trivial http://search.cpan.org/src/GAAS/libwww-perl-5.805/lib/LWP/Simple.pm\r
+#              added MapoftheInternet.com http://MapoftheInternet.com/\r
+#              added Matrix S.p.A. - FAST Enterprise Crawler http://tin.virgilio.it/\r
+#              added Megite http://www.megite.com/\r
+#              added Metaspinner http://index.meta-spinner.de/\r
+#              added Mini-reptile\r
+#              added Misterbot http://www.misterbot.fr/\r
+#              added Miva http://www.miva.com/\r
+#              added Mizzu Labs http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_m_141105_2\b\r
+#              added MSRBOT http://research.microsoft.com/research/sv/msrbot/\r
+#              added MS SharePoint Portal Server - MS Search 4.0 Robot http://support.microsoft.com/default.aspx?scid=kb;en-us;284022\r
+#              added Mydoyouhike http://www.doyouhike.net/my\r
+#              added NASA Search http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_n_s_140506_2\b\r
+#              added NetSprint http://www.netsprint.pl/serwis/\r
+#              added NimbleCrawler http://www.healthline.com/\r
+#              added OpenWebSpider http://www.openwebspider.org/\r
+#              added Oracle Ultra Search http://www.oracle.com/technology/products/ultrasearch/index.html\r
+#              added OSSProxy http://www.marketscore.com/FAQ.Aspx\r
+#              added passwordmaker.org http://passwordmaker.org/\r
+#              added PEAR HTTP Request class http://pear.php.net/\r
+#              added PEERbot http://www.peerbot.com/\r
+#              added PHP version tracker http://www.nexen.net/phpversion/bot.php\r
+#              added PictureOfInternet http://malfunction.org/poi/\r
+#              added plinki http://www.plinki.com/\r
+#              added Port Huron Labs http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_n_s_1133\b\r
+#              added PostFavorites http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_n_s_1135\b\r
+#              added ProjectWF-java-test-crawler\r
+#              added PyQuery http://sourceforge.net/projects/pyquery/\r
+#              added Schizozilla http://spamhuntress.com/2005/03/18/gizmo/\r
+#              added Scumbot\r
+#              added Sensis Web Crawler http://www.sensis.com.au/\r
+#              added snap.com beta crawler http://www.snap.com/\r
+#              added Steeler http://www.tkl.iis.u-tokyo.ac.jp/~crawler/\r
+#              added STEROID  Download http://faqs.org.ru/progr/pascal/delphi_internet2.htm\r
+#              added Suchfin-Bot http://www.suchfin.de/\r
+#              added Sunrise http://www.sunrisexp.com/\r
+#              added Tagyu Agent http://www.tagyu.com/\r
+#              added Tcl http client package http://www.tcl.tk/man/tcl8.4/TclCmd/http.htm\r
+#              added TeragramCrawlerSURF http://www.teragram.com/\r
+#              added Test Crawler http://netp.ath.cx/\r
+#              added UnChaos Bot Hybrid Web Search Engine http://www.unchaos.com/\r
+#              added unido-bot http://www.unchina.org/unido/unido/our_projects/3_3.html\r
+#              added UniversalFeedParser http://feedparser.org/ (seen from md301000.inktomisearch.com)\r
+#              added updated http://www.updated.com/\r
+#              added Vermut http://vermut.aol.com\r
+#              added versus crawler from eda.baykan@epfl.ch http://www.epfl.ch/Eindex.html\r
+#              added Vespa Crawler (Yahoo Norway?) http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=%5Cbid_t_z_030406_1%5Cb\r
+#              added VSE http://www.vivisimo.com/\r
+#              added webcrawl.net http://www.webcrawl.net/\r
+#              added Web Downloader http://www.krasu.ru/soft/chuchelo/\r
+#              added Webdup http://www.webdup.com/en/index.html\r
+#              added Wells Search http://www.psychedelix.com/cgi-bin/csv2html.pl?data=allagents.csv&template=detail.html&match=\bid_t_z_1484\b\r
+#              added WordPress http://wordpress.org/\r
+#              added wume crawler http://wume.cse.lehigh.edu/~xiq204/crawler/\r
+#              added Xenu's Link Sleuth (with ')\r
+#              added xirq http://www.xirq.com/\r
+#              added yoogliFetchAgent http://www.yoogli.com/\r
+#              added Z-Add Link Checker http://w3.z-add.co.uk/linkcheck/\r
+#              -- fix - some robots were reported with _ where _ should have been a space.\r
+#              changed Xenu Link Sleuth\r
+#              changed microsoft[_+\s]url[_+\s]control -> microsoft_url_control\r
+#              changed favorites_sweeper -> favorites_sweeper\r
+#              -- updates\r
+#              updated AskJeeves to Ask\r
+# 2012-06-05 Albrecht Mueller\r
+#              added Grabber from SDSC (San Diego Supercomputer Center).\r
+# 2013-09-30 Albrecht Mueller\r
+# AWStats probably cannot detect this bot as it identifies itself in\r
+# the referrer field and not in the user agent string.\r
+#92.113.100.35 - - [29/Sep/2013:17:22:46 +0200] "GET /robots.txt HTTP/1.1" 200 516 "-" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"\r
+#92.113.100.35 - - [29/Sep/2013:17:22:49 +0200] "GET /tghome.htm HTTP/1.1" 200 4445 "http://extrabot.com/help/frytygativyheku.htm" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"\r
+#92.113.100.35 - - [29/Sep/2013:17:22:51 +0200] "GET / HTTP/1.1" 200 5467 "http://extrabot.com/help/frytygativyheku.htm" "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:5.0) Gecko/20100101 Firefox/5.0" "-"\r
+\r
+# to do  MS Search 4.0 Robot\r
+\r
+#package AWSROB;\r
+\r
+\r
+# Robots list was found at http://www.robotstxt.org/wc/active/all.txt\r
+# Other robots can be found at http://www.jafsoft.com/searchengines/webbots.html\r
+# Rem: To avoid bad detection, some robot's ids were removed from this list:\r
+#      - Robots with ID of 3 letters only\r
+#      - Robots called 'webs' and 'tcl'\r
+# Rem: directhit changed into direct_hit (its real id)\r
+# Rem: calif changed into calif[^r] to avoid confusion with the Tiscalifreenet browser\r
+# Rem: fish changed into [^a]fish to avoid confusion with the Madsafish browser\r
+# Rem: roadrunner changed into road_runner\r
+# Rem: lycos changed to lycos_ to avoid confusion with lycos-online browser\r
+# Rem: voyager changed into ^voyager\/ to avoid excluding the voyager and amigavoyager browsers\r
+\r
+# RobotsSearchIDOrder\r
+# It contains all matching criteria to search for in log fields. This list is\r
+# used to know in which order to search Robot IDs.\r
+# Most frequent ones are in list1, used when LevelForRobotsDetection is 1 or more\r
+# Minor robots are in list2, used when LevelForRobotsDetection is 2 or more\r
+# Note: Robots IDs are in lower case, '_', ' ' and '+' are changed into '[_+\s]' and are quoted.\r
+#-------------------------------------------------------\r
+\r
+# Primary robot signatures, searched when LevelForRobotsDetection is 1 or more.\r
+# Every entry is a Perl regular expression fragment. The list is searched in\r
+# the order given here, so a specific signature has to be listed before any\r
+# generic pattern that would also match the same user agent string.\r
+# Entries contain no literal whitespace; a space is written as [\x20].\r
+# NOTE(review): each string is presumably also used verbatim as a key in\r
+# RobotsHashIDLib, so do not re-spell an entry here without updating it there.\r
+@RobotsSearchIDOrder_list1 = (\r
+# Common robots (In robot file)\r
+'bingbot/',\r
+'bingpreview',\r
+'MSIECrawler',\r
+'msnbot/',\r
+'msnbot\-media/',\r
+'AdIdxBot/',\r
+'NOT[\x20]Googlebot/',\r
+'Googlebot/',\r
+'Google[\x20]Web[\x20]Preview',\r
+'Googlebot\-Image/',\r
+'Googlebot\-Mobile/',\r
+'google\-sitemaps',\r
+'Googlebot\-News',\r
+'Googlebot\-Video/',\r
+'AdsBot\-Google[\x20]\(',\r
+'AdsBot\-Google\-Mobile\-Apps',\r
+'Mediapartners-Google',\r
+'Feedfetcher\-Google',\r
+'Google\-Adwords\-Instant',\r
+'Firefox/1\.5',\r
+'Yahoo![\x20]Slurp[\x20]China',\r
+'Yahoo![\x20]Slurp',\r
+'Baiduspider/',\r
+'Baiduspider\-image',\r
+'baidu',\r
+'YandexBot/',\r
+'YandexImages/',\r
+'YandexMetrika/',\r
+'YandexMobileBot/',\r
+'yandex',\r
+'electricmonk/',\r
+'spbot/',\r
+'SeznamBot/',\r
+'msie8',\r
+'AhrefsBot/',\r
+'007ac9[\x20]Crawler',\r
+'2345Explorer/',\r
+'360Spider',\r
+'A[\x20]Simple[\x20]Crawler',\r
+'Abrave',\r
+'acapbot/',\r
+'Accoona\-AI\-Agent/',\r
+'AdnormCrawlerCatchBot/',\r
+'aiHitBot/',\r
+'aipbot/',\r
+'Apache\-HttpClient/',\r
+'Apexoo[\x20]Spider',\r
+'Applebot/',\r
+'archive\.org_bot',\r
+'Babya[\x20]Discoverer',\r
+'BDCbot/',\r
+'BinGet/',\r
+'bl\.uk_lddc_bot/',\r
+'BLEXBot/',\r
+'boitho\.com\-dc/',\r
+'BusinessBot:',\r
+'CatchBot/',\r
+'CB/Nutch',\r
+'CCBot/',\r
+'Cliqzbot/',\r
+'CMS[\x20]Crawler',\r
+'ConveraCrawler/',\r
+'cosmos/',\r
+'crawl/Nutch',\r
+'crawler4j',\r
+'CRAZYWEBCRAWLER',\r
+'CSE[\x20]HTML[\x20]Validator',\r
+'C\-T[\x20]bot',\r
+'Curl/PHP',\r
+'Dalvik/',\r
+'DataCrawler/',\r
+'Deepnet[\x20]Explorer',\r
+'DeuSu/',\r
+'Digincore',\r
+'Discordbot/',\r
+'DoCoMo/',\r
+'Domain[\x20]Re\-Animator[\x20]Bot',\r
+'DomainCrawler/',\r
+'DomainMacroCrawler/',\r
+'DomainSONOCrawler/',\r
+'DomainStatsBot/',\r
+'DotBot/',\r
+'DuckDuckGo\-Favicons\-Bot/',\r
+'ELinks/',\r
+'ELinks[\x20]\(',\r
+'EmailMarketingRobot/',\r
+'EmeraldShield\.com[\x20]WebBot',\r
+'envolk\[ITS\]spider/',\r
+'EsperanzaBot',\r
+'Exabot/',\r
+'facebookexternalhit/',\r
+'fast_enterprise_crawler.*scrawleradmin\.t\-info@telekom\.de',\r
+'fast_enterprise_crawler.*t\-info_bi_cluster_crawleradmin\.t\-info@telekom\.de',\r
+'FAST\-WebCrawler/',\r
+'Feosey[\x20]Mohk[\x20]Crawler',\r
+'findlinks/',\r
+'Findxbot/',\r
+'FirePHP/',\r
+'FlippyBearBot/',\r
+'FreeWebMonitoring[\x20]SiteChecker/',\r
+'fujilabol',\r
+'FurlBot/',\r
+'Gaisbot/',\r
+'Gallent[\x20]Spider',\r
+'GarlikCrawler/',\r
+'GetintentCrawler[\x20]getintent\.com',\r
+'Gigabot/',\r
+'gipo\-crawler/Nutch',\r
+'Girafabot',\r
+'Gluten[\x20]Free[\x20]Crawler/',\r
+'gocrawl',\r
+'GrapeshotCrawler/',\r
+'GSiteCrawler/',\r
+'GurujiBot/',\r
+'HaosouSpider',\r
+'holmes/',\r
+'HTTP_Request2/',\r
+'HubSpot[\x20]Webcrawler',\r
+'HyperCrawl/',\r
+'ICC\-Crawler/',\r
+'iconoclast',\r
+'IDGCrawler/Nutch',\r
+'idmarch[\x20]Automatic\.beta/',\r
+'Incutio[\x20]XML',\r
+'InfluenceBot',\r
+'IRLbot/',\r
+'IssueCrawler',\r
+'istellabot/',\r
+'James[\x20]BOT',\r
+'Jigsaw/',\r
+'JobFeed',\r
+'KomodiaBot/',\r
+'Konqueror/',\r
+'linkapediabot',\r
+'metager\-linkchecker',\r
+'linkchecker',\r
+'LinkCheck',\r
+'linkdexbot/',\r
+'LinkedInBot/',\r
+'LinkpadBot/',\r
+'Links[\x20]\(',\r
+'LinksManager\.com_bot',\r
+'LWP::Simple/',\r
+'Mail\.RU_Bot/',\r
+'meanpathbot/',\r
+'Mediatoolkitbot',\r
+'MegaIndex\.ru/',\r
+'merzscope',\r
+'mfibot/',\r
+'microsoft.*discovery',\r
+'missigua_locator',\r
+'MixrankBot',\r
+'MJ12bot/',\r
+'MojeekBot/',\r
+'Mojolicious',\r
+'MXT/Nutch',\r
+'My[\x20]Nutch[\x20]Spider/',\r
+'myse/Nutch',\r
+'NerdyBot',\r
+'netEstate[\x20]NE[\x20]Crawler',\r
+'NetResearchServer/',\r
+'NRLCorpusBuilder/Nutch',\r
+'nutch\-1\.4/',\r
+'nutch\-1\.8/',\r
+'NutchCVS/',\r
+'o\.uk[\x20]robot',\r
+'oBot/',\r
+'ocrawler;',\r
+'ODP[\x20]link[\x20]checker',\r
+'Offline[\x20]Explorer/',\r
+'OmniExplorer_Bot/',\r
+'OrangeBot/',\r
+'PageBitesHyperBot/',\r
+'pdffillerbot/',\r
+'PhantomJS',\r
+'PHP/5\.2\.8',\r
+'Ploetz[\x20]\+[\x20]Zeller',\r
+'Plukkie/',\r
+'Princetonbot/',\r
+'PrivacyAwareBot/',\r
+'proximic',\r
+'psbot/',\r
+'psbot\-image',\r
+'python_wk_crawler',\r
+'Python\-urllib/',\r
+'QCrawl',\r
+'ResearchBot',\r
+'roboto',\r
+'rogerbot/',\r
+'RSSingBot',\r
+'RukiCrawler/',\r
+'SafeDNS[\x20]search[\x20]bot/',\r
+'SafeDNSBot',\r
+'SafeSearch[\x20]microdata[\x20]crawler',\r
+'safesearch',\r
+'SBL\-BOT',\r
+'Screaming[\x20]Frog[\x20]SEO[\x20]Spider/',\r
+'ScreenerBot[\x20]Crawler[\x20]Beta',\r
+'Searchie/',\r
+'Seekmo',\r
+'semanticbot',\r
+'SemrushBot/',\r
+'seo\-audit\-check\-bot/',\r
+'Seobility',\r
+'SEOkicks\-Robot',\r
+'SEOlyticsCrawler/',\r
+'SEOstats',\r
+'Seosys/Nutch',\r
+'Seoterritory\.com[\x20]bot',\r
+'Shim\-Crawler',\r
+'SiteExplorer/',\r
+'siteexplorer\.info',\r
+'Slackbot\-LinkExpanding',\r
+'SmabblerBot/',\r
+'Sogou[\x20]web[\x20]spider/',\r
+'special_archiver/',\r
+'Spiderbot/',\r
+'ssearch_bot',\r
+'SurdotlyBot/',\r
+'SurveyBot/',\r
+'taiil/Nutch',\r
+'tbot\-nutch',\r
+'TeeRaidBot',\r
+'TelegramBot',\r
+'Test/Nutch',\r
+'Test[\x20]Spider',\r
+'TestCrawler',\r
+'TurnitinBot/',\r
+'TurnitinBot',\r
+'TweetmemeBot/',\r
+'UCY/Nutch',\r
+'Uptimebot/',\r
+'URL[\x20]Checker',\r
+'UXCrawlerBot',\r
+'Validator\.nu/',\r
+'vBSEO',\r
+'vBulletin[\x20]via[\x20]PHP',\r
+'vebidoobot',\r
+'viz/Nutch',\r
+'VoilaBot',\r
+'VORTEX/',\r
+'voyager/',\r
+'W3C_Validator/',\r
+'W3C\-checklink/',\r
+'WBSearchBot/',\r
+'WeSEE:Ads/PageBot',\r
+'WeSEE:Ads/PictureBot',\r
+'WeSEE_Bot',\r
+'Wget/',\r
+'Who\.is[\x20]Bot',\r
+'wonderbot/',\r
+'woobot/',\r
+'Wotbox/',\r
+'Xaldon[\x20]WebSpider',\r
+'Xenu[\x20]Link[\x20]Sleuth',\r
+'xenu_link_sleuth',\r
+'XML[\x20]Sitemaps[\x20]Generator',\r
+'XoviBot/',\r
+'yacybot',\r
+'Yahoo[\x20]Link[\x20]Preview',\r
+'YisouSpider',\r
+'yoozBot',\r
+'zspider/',\r
+'ZumBot/',\r
+# below placed at end to catch some generics\r
+# 'Crawler/' is kept here instead of in alphabetical position: it is a\r
+# substring of DataCrawler/, DomainCrawler/, GarlikCrawler/, GrapeshotCrawler/,\r
+# GSiteCrawler/, ICC-Crawler/, RukiCrawler/, SEOlyticsCrawler/ and others, so\r
+# listing it earlier would make those specific entries unreachable.\r
+'Crawler/',\r
+'nbot',\r
+'ng/1\.',\r
+'ng/2\.',\r
+'libwww\-perl',\r
+'CFNetwork',\r
+'urllib',\r
+'javabee',\r
+'projectwf\-java\-test\-crawler',\r
+'java',\r
+'loocalcrawler/nutch',\r
+'nutchosu\-vlib',\r
+'nutch',\r
+'perlcrawler',\r
+'perl',\r
+# old robots using firefox < version 11 not identifying themselves as a robot.\r
+'(firefox/)([0-9]\.|[0-1][0]\.)'\r
+);\r
+\r
+@RobotsSearchIDOrder_list2 = (\r
+# Less common robots (In robot file)\r
+'^Mozilla$',\r
+'^mozilla\/3\.0\s\(compatible$',\r
+'^mozilla\/4\.0$',\r
+'^mozilla\/4\.0\s\(compatible;\)$',\r
+'^mozilla\/5\.0$',\r
+'^mozilla\/5\.0\s\(compatible;$',\r
+'^mozilla\/5\.0\s\(en\-us\)$',\r
+'^mozilla\/5\.0\sfirefox\/3\.0\.5$',\r
+'^Mozilla/6\.0[\x20]\(compatible\)$',\r
+'^Mozilla/(.*)Beta[\x20]\(Windows\)',\r
+'MSIE[\x20]2',\r
+'MSIE[\x20]3',\r
+'MSIE[\x20]4',\r
+'MSIE[\x20]5',\r
+'MSIE[\x20]6',\r
+'Windows[\x20]95',\r
+'Windows[\x20]98',\r
+\r
+# these could be removed to speed up processing as they are rarely seen\r
+'a6\-indexer',\r
+'abcdatos',\r
+'abonti\.com',\r
+'acme\.spider',\r
+'activebookmark',\r
+'adamm_bot',\r
+'advbot',\r
+'affectv\.co\.uk',\r
+'ahoythehomepagefinder',\r
+'aleadsoftbot',\r
+'alkaline',\r
+'allrati',\r
+'alltop',\r
+'almaden',\r
+'alpha_search_agent',\r
+'anthill',\r
+'antibot',\r
+'aport',\r
+'appie',\r
+'applesyndication',\r
+'arachnophilia',\r
+'arale',\r
+'araneo',\r
+'architext',\r
+'archive\-de\.com',\r
+'aretha',\r
+'argus',\r
+'ariadne',\r
+'arianna\.libero\.it',\r
+'arks',\r
+'aspider',\r
+'aspseek',\r
+'asterias',\r
+'asynchttpclient',\r
+'atn\.txt',\r
+'atomz',\r
+'auresys',\r
+'awbot',\r
+'backlinktest\.com',\r
+'backrub',\r
+'bbot',\r
+'becomebot',\r
+'bender',\r
+'betabot',\r
+'bigbrother',\r
+'biglotron',\r
+'BingLocalSearch',\r
+'bittorrent_bot',\r
+'biz360[_+\s]spider',\r
+'bjaaland',\r
+'blackwidow',\r
+'blindekuh',\r
+'blogbridge[_+\s]service',\r
+'blogged_crawl',\r
+'bloglines',\r
+'bloglovin',\r
+'blogpulse',\r
+'blogsearch',\r
+'blogshares',\r
+'blogslive',\r
+'blogssay',\r
+'bloodhound',\r
+'bncf\.firenze\.sbn\.it/raccolta\.txt',\r
+'bobby',\r
+'bookmark\-manager',\r
+'borg\-bot',\r
+'boris',\r
+'brightnet',\r
+'bruinbot',\r
+'bspider',\r
+'bubing',\r
+'bumblebee',\r
+'butterfly',\r
+'buzztracker',\r
+'cactvschemistryspider',\r
+'calif[^r]',\r
+'candlelight[_+\s]favorites[_+\s]inspector',\r
+'careerbot',\r
+'carpathia',\r
+'cassandra',\r
+'catbot',\r
+'cbn00glebot',\r
+'cerberian_drtrs',\r
+'cfetch',\r
+'cgireader',\r
+'chattertrap',\r
+'check_http',\r
+'checkbot',\r
+'checkweb_link_validator',\r
+'christcrawler',\r
+'churl',\r
+'cienciaficcion',\r
+'cipinetbot',\r
+'imagecoccoc',\r
+'coccoc',\r
+'coldfusion',\r
+'collective',\r
+'combine',\r
+'commons\-httpclient',\r
+'computer_and_automation_research_institute_crawler',\r
+'conceptbot',\r
+'contentmatch',\r
+'converamultimediacrawler',\r
+'coolbot',\r
+'copubbot',\r
+'core',\r
+'covario',\r
+'cruiser',\r
+'cscrawler',\r
+'cuasarbot',\r
+'cursor',\r
+'cusco',\r
+'custo',\r
+'cyberspyder',\r
+'datafountains/dmoz_downloader',\r
+'dataprovider\.com',\r
+'daumoa',\r
+'daviesbot',\r
+'daylifefeedfetcher',\r
+'daypopbot',\r
+'deepindex',\r
+'desertrealm',\r
+'deweb',\r
+'dienstspider',\r
+'digger',\r
+'digout4u',\r
+'diibot',\r
+'dipsie\.bot',\r
+'direct_hit',\r
+'discobot',\r
+'dlvr\.it',\r
+'dnabot',\r
+'dnsgroup',\r
+'doccheckbot',\r
+'domainappender',\r
+'domainchecker',\r
+'domainsdb\.net',\r
+'download_express',\r
+'dragonbot',\r
+'dreamwidth',\r
+'drupal',\r
+'dulance',\r
+'dumbot',\r
+'dumm\.de\-bot',\r
+'dwcp',\r
+'e\-collector',\r
+'earthcom\.info',\r
+'easydl',\r
+'ebiness',\r
+'eccp',\r
+'echo!',\r
+'edgeio\-retriever',\r
+'elfinbot',\r
+'emacs',\r
+'emcspider',\r
+'enteprise',\r
+'ernst[:blank:]2\.0',\r
+'esther',\r
+'ets_v',\r
+'eventax',\r
+'everbeecrawler',\r
+'everest\-vulcan',\r
+'evliyacelebi',\r
+'exactseek',\r
+'extreme[_+\s]picture[_+\s]finder',\r
+'ezoom',\r
+'ezresult',\r
+'facebook',\r
+'facebot',\r
+'fast\-search\-engine',\r
+'matrix_s\.p\.a\._\-_fast_enterprise_crawler',\r
+'fast_enterprise_crawler',\r
+'fastbot',\r
+'fastcrawler',\r
+'favicon',\r
+'favorg',\r
+'favorites_sweeper',\r
+'fdse',\r
+'feedburner',\r
+'feedcrawl',\r
+'feedflow',\r
+'feedmyinbox',\r
+'feedroll\.com',\r
+'feedsky',\r
+'feedster',\r
+'feedvalidator',\r
+'feedzira',\r
+'felix',\r
+'ferret',\r
+'fetchbot',\r
+'fetchrover',\r
+'fever/',\r
+'fido',\r
+'filmkamerabot',\r
+'filterdb\.iss\.net',\r
+'finderlein[_+\s]research[_+\s]crawler',\r
+'findexa_crawler',\r
+'finnish',\r
+'fireball',\r
+'firmilybot',\r
+'flexum',\r
+'foaf\-search\.net',\r
+'fooky\.com/ScorpionBot',\r
+'fouineur',\r
+'francoroute',\r
+'freecrawl',\r
+'freenews',\r
+'funnelweb',\r
+'g2crawler',\r
+'gama',\r
+'gazz',\r
+'gcreep',\r
+'geniebot',\r
+'genieo',\r
+'geohasher',\r
+'getbot',\r
+'geturl',\r
+'gigablastopensource',\r
+'global_fetch',\r
+'gnodspider',\r
+'goforit\.com',\r
+'goforitbot',\r
+'golem',\r
+'gonzo',\r
+'gougou',\r
+'gpu_p2p_crawler',\r
+'grabber',\r
+'grapeshot',\r
+'grapnel',\r
+'griffon',\r
+'gromit',\r
+'grub',\r
+'gulliver',\r
+'gulperbot',\r
+'hambot',\r
+'hanrss',\r
+'harvest',\r
+'havindex',\r
+'henrythemiragorobot',\r
+'heritrix',\r
+'hl_ftien_spider',\r
+'hometown',\r
+'hoowwwer',\r
+'hpprint',\r
+'htdig',\r
+'html[_+\s]link[_+\s]validator',\r
+'htmlgobble',\r
+'htmlparser',\r
+'httrack',\r
+'hundesuche\.com\-bot',\r
+'hyperdecontextualizer',\r
+'ia_archiver\-web\.archive\.org',\r
+'ia_archiver',\r
+'iajabot',\r
+'iaskspider',\r
+'i\-bot',\r
+'icarus6j',\r
+'ichiro',\r
+'icjobs\.de',\r
+'ilse',\r
+'iltrovatore\-setaccio',\r
+'imagelock',\r
+'implisensebot',\r
+'inagist',\r
+'incywincy',\r
+'infobot',\r
+'infociousbot',\r
+'infohelfer',\r
+'infomine',\r
+'informant',\r
+'infoseeksidewinder',\r
+'infoseek',\r
+'infospider',\r
+'inspectorwww',\r
+'insurancobot',\r
+'integromedb\.org',\r
+'intelliagent',\r
+'internet[_+\s]ninja',\r
+'internetarchive',\r
+'internetseer',\r
+'internetsupervision',\r
+'ips\-agent',\r
+'irobot',\r
+'iron33',\r
+'isearch2006',\r
+'israelisearch',\r
+'iupui_research_bot',\r
+'izsearch',\r
+'jacobin[\x20]club',\r
+'jakarta',\r
+'jbot',\r
+'jcrawler',\r
+'jeeves',\r
+'jennybot',\r
+'jobboerse',\r
+'jobot',\r
+'jobo',\r
+'joebot',\r
+'jrtwine[_+\s]software[_+\s]check[_+\s]favorites[_+\s]utility',\r
+'js\-kit',\r
+'jubii',\r
+'jumpstation',\r
+'justview',\r
+'kalambot',\r
+'kamano\.de_newsfeedverzeichnis',\r
+'kapsi',\r
+'katipo',\r
+'kazoombot',\r
+'kevin',\r
+'keyoshid',\r
+'kilroy',\r
+'kinja\-imagebot',\r
+'kinjabot',\r
+'knowitall',\r
+'knowledge\.com',\r
+'ko[_+\s]yappo[_+\s]robot',\r
+'kouaa_krawler',\r
+'krugle',\r
+'ksibot',\r
+'kummhttp',\r
+'kurzor',\r
+'labelgrabber\.txt',\r
+'lanshanbot',\r
+'larbin',\r
+'largesmall[\x20]crawler',\r
+'legs',\r
+'letscrawl\.com',\r
+'libcrawl',\r
+'lilina',\r
+'link_valet_online',\r
+'linkbot',\r
+'linkdex\.com',\r
+'linkidator',\r
+'linkscan',\r
+'linkstats[\x20]bot',\r
+'linkwalker',\r
+'lipperhey',\r
+'livejournal\.com',\r
+'lmspider',\r
+'loadtimebot',\r
+'lockon',\r
+'logo_gif',\r
+'longurl',\r
+'lssrocketcrawler',\r
+'ltbot',\r
+'ltx71',\r
+'lwp\-request',\r
+'lwp\-trivial',\r
+'lycos[_+\s]',\r
+'macworm',\r
+'madaali\.de',\r
+'magpierss',\r
+'magpie',\r
+'mapoftheinternet\.com',\r
+'marvin',\r
+'mattie',\r
+'mediabot',\r
+'mediafox',\r
+'megaindex',\r
+'megite',\r
+'memorybot',\r
+'mercator',\r
+'meshexplorer',\r
+'metager2\-verification\-bot',\r
+'metajobbot',\r
+'metaspinner',\r
+'metauri',\r
+'miadev',\r
+'microsoft[_+\s]url[_+\s]control',\r
+'microsoft[\x20]bits',\r
+'microsoft\-webdav\-miniredir',\r
+'mindcrawler',\r
+'mindupbot',\r
+'mini\-reptile',\r
+'minirank',\r
+'misterbot',\r
+'miva',\r
+'mizzu_labs',\r
+'mnogosearch',\r
+'moget',\r
+'momspider',\r
+'monster',\r
+'motor',\r
+'movabletype',\r
+'ms[_+\s]search[_+\s]6\.0[_+\s]robot',\r
+'ms_search_4\.0_robot',\r
+'msnbot\-udiscovery',\r
+'msrabot',\r
+'msrbot',\r
+'mt::telegraph::agent',\r
+'muncher',\r
+'muscatferret',\r
+'mwdsearch',\r
+'mydoyouhike',\r
+'myweb',\r
+'nagios',\r
+'nasa_search',\r
+'ndspider',\r
+'nederland\.zoek',\r
+'netcarta',\r
+'netcraft',\r
+'netluchs',\r
+'netmechanic',\r
+'netnewswire',\r
+'netscoop',\r
+'netsprint',\r
+'netvibes',\r
+'newrelicpinger',\r
+'newscan\-online',\r
+'newsfox',\r
+'newsgatoronline',\r
+'nextgensearchbot',\r
+'nhse',\r
+'nicebot',\r
+'nimblecrawler',\r
+'ning',\r
+'nomad',\r
+'northstar',\r
+'noxtrumbot',\r
+'npbot',\r
+'nzexplorer',\r
+'objectssearch',\r
+'occam',\r
+'ocelli',\r
+'octopus',\r
+'octora_beta_bot',\r
+'onet\.pl[_+\s]sa',\r
+'onfolio',\r
+'openfind',\r
+'opentaggerbot',\r
+'openwebspider',\r
+'optimizer',\r
+'oracle_ultra_search',\r
+'orb_search',\r
+'orbiter',\r
+'packrat',\r
+'pageboy',\r
+'panscient',\r
+'parasite',\r
+'passwordmaker\.org',\r
+'patric',\r
+'pear_http_request_class',\r
+'peerbot',\r
+'pegasus',\r
+'perignator',\r
+'perman',\r
+'petersnews',\r
+'phantom',\r
+'php[_+\s]version[_+\s]tracker',\r
+'phpcrawl',\r
+'phpdig',\r
+'picmole',\r
+'pictureofinternet',\r
+'piltdownman',\r
+'pimptrain',\r
+'ping\.blo\.gs',\r
+'pingdom',\r
+'pioneer',\r
+'pita',\r
+'pitkow',\r
+'pjspider',\r
+'plinki',\r
+'pluckfeedcrawler',\r
+'plumtreewebaccessor',\r
+'pogodak',\r
+'pompos',\r
+'popdexter',\r
+'poppi',\r
+'port_huron_labs',\r
+'portalb',\r
+'postfavorites',\r
+'postpost',\r
+'postrank',\r
+'powermarks',\r
+'printfulbot',\r
+'proodlebot',\r
+'protopage',\r
+'publiclibraryarchive',\r
+'pyquery',\r
+'python',\r
+'qihoobot',\r
+'quipply',\r
+'qwantify',\r
+'r6\_',\r
+'rambler',\r
+'ratingburner',\r
+'raven',\r
+'rbse',\r
+'redalert',\r
+'regator',\r
+'relevantnoise\.com',\r
+'resumerobot',\r
+'rhcs',\r
+'riddler',\r
+'road_runner',\r
+'robbie',\r
+'robi',\r
+'robocrawl',\r
+'robofox',\r
+'robozilla',\r
+'rojo',\r
+'rome[\x20]client',\r
+'roverbot',\r
+'rpt\-httpclient',\r
+'rssgraffiti',\r
+'rssimagesbot',\r
+'ruffle',\r
+'rufusbot',\r
+'rules',\r
+'safeads\.xyz',\r
+'safetynetrobot',\r
+'sage\+\+',\r
+'sandcrawler',\r
+'savetheworldheritage',\r
+'sbider',\r
+'schizozilla',\r
+'scooter',\r
+'scoutjet',\r
+'scumbot',\r
+'search\-info',\r
+'search_au',\r
+'searchguild[_+\s]dmoz[_+\s]experiment',\r
+'searchmetricsbot',\r
+'searchprocess',\r
+'seekbot',\r
+'semalt',\r
+'senrigan',\r
+'sensis_web_crawler',\r
+'seodiver',\r
+'seokicks\.de',\r
+'seoscanners',\r
+'sgscout',\r
+'shaggy',\r
+'shaihulud',\r
+'shareaholicbot',\r
+'shoutcast',\r
+'sift',\r
+'simbot',\r
+'simplepie',\r
+'sistrix',\r
+'site\-valet',\r
+'sitebot',\r
+'sitedomain\-bot',\r
+'sitetech',\r
+'skimbot',\r
+'skymob',\r
+'slcrawler',\r
+'slurp',\r
+'slysearch',\r
+'smartspider',\r
+'smtbot',\r
+'snap\.com_beta_crawler',\r
+'snappy',\r
+'snooper',\r
+'sohu\-search',\r
+'sohu',\r
+'solbot',\r
+'speedy',\r
+'sphere_scout',\r
+'spider[_+\s]monkey',\r
+'spiderline',\r
+'spiderlytics',\r
+'spiderman',\r
+'spiderview',\r
+'spip',\r
+'sproose_crawler',\r
+'spry',\r
+'sqworm',\r
+'ssearcher',\r
+'steeler',\r
+'steroid__download',\r
+'stq_bot',\r
+'Stratagems[\x20]Kumo',\r
+'suchfin\-bot',\r
+'suke',\r
+'summify\.com',\r
+'sunrise',\r
+'suntek',\r
+'superbot',\r
+'superfeedr',\r
+'susie',\r
+'sven',\r
+'syndic8',\r
+'syndicapi',\r
+'synoobot',\r
+'synthesio',\r
+'t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e',\r
+'tach_bw',\r
+'tagyu_agent',\r
+'tailrank',\r
+'tarantula',\r
+'tarspider',\r
+'tcl_http_client_package',\r
+'techbot',\r
+'technoratibot',\r
+'templeton',\r
+'teoma',\r
+'teragramcrawlersurf',\r
+'test_crawler',\r
+'testbot',\r
+'thumbsniper',\r
+'titan',\r
+'titin',\r
+'tkwww',\r
+'tlspider',\r
+'topblogsinfo',\r
+'topicblogs',\r
+'topix\.net',\r
+'trapit',\r
+'trileet',\r
+'turtlescanner',\r
+'turtle',\r
+'tutorgigbot',\r
+'tweetedtimes',\r
+'twiceler',\r
+'twisted[\x20]pagegetter',\r
+'twitterbot',\r
+'twitterfeed',\r
+'ubicrawler',\r
+'ucsd',\r
+'udmsearch',\r
+'ultraseek',\r
+'unchaos_bot_hybrid_web_search_engine',\r
+'unido\-bot',\r
+'unisterbot',\r
+'universalfeedparser',\r
+'unlost_web_crawler',\r
+'unwindfetchor',\r
+'updated',\r
+'urlck',\r
+'ustc\-semantic\-group',\r
+'vagabondo\-wap',\r
+'vagabondo',\r
+'valkyrie',\r
+'vermut',\r
+'versus_crawler_from_eda\.baykan@epfl\.ch',\r
+'verticrawl',\r
+'vespa_crawler',\r
+'victoria',\r
+'virus[_+\s]detector',\r
+'visionsearch',\r
+'voidbot',\r
+'voltron',\r
+'vse/',\r
+'vwbot',\r
+'w3c[_+\s]css[_+\s]validator[_+\s]jfouffa',\r
+'w3index',\r
+'w3m2',\r
+'wallpaper',\r
+'wanderer',\r
+'wapspider',\r
+'wapspIRLider',\r
+'watchmouse',\r
+'wavefire',\r
+'waybackarchive\.org',\r
+'wazzup',\r
+'web_downloader',\r
+'webbandit',\r
+'webbase',\r
+'webcatcher',\r
+'webclipping\.com',\r
+'webcollage',\r
+'webcompass',\r
+'webcopy',\r
+'webcrawl\.net',\r
+'webdup',\r
+'webfetcher',\r
+'webfilter',\r
+'webfoot',\r
+'webinator',\r
+'webindexer',\r
+'weblayers',\r
+'weblinker',\r
+'webminer',\r
+'webmirror',\r
+'webmoose',\r
+'webquest',\r
+'webreader',\r
+'webreaper',\r
+'website[_+\s]monitoring[_+\s]bot',\r
+'websnarf',\r
+'webspider',\r
+'webvac',\r
+'webvulncrawl',\r
+'webwalker',\r
+'webwalk',\r
+'webwatch',\r
+'wells_search',\r
+'wer\-liefert\-was',\r
+'wesee:search',\r
+'wevikabot',\r
+'whatuseek',\r
+'whowhere',\r
+'windows\-rss\-platform',\r
+'wired\-digital',\r
+'zyborg',\r
+'wisenutbot',\r
+'wiumi',\r
+'wmir',\r
+'wolp',\r
+'wombat',\r
+'wonderer',\r
+'woozweb',\r
+'wordpress',\r
+'worm',\r
+'wume_crawler',\r
+'wwwc',\r
+'wwweasel',\r
+'wz101',\r
+'xget',\r
+'xirq',\r
+'xydo',\r
+'y!j',\r
+'yahoo![\x20]searchmonkey',\r
+'yahoo!_mindset',\r
+'yahoo\-blogs',\r
+'yahoo\-mmcrawler',\r
+'yahoo\-newscrawler',\r
+'yahoo[\x20]pipes',\r
+'yahoo\-verticalcrawler',\r
+'yahoocachesystem',\r
+'yahooexternalcache',\r
+'yahoofeedseeker',\r
+'yahooseeker\-testing',\r
+'yahooseeker',\r
+'yahooysmcm',\r
+'yammer',\r
+'yanga',\r
+'yet\-another\-spider',\r
+'yeti',\r
+'yie8',\r
+'yodaobot',\r
+'yooglifetchagent',\r
+'youdao',\r
+'yourls',\r
+'z\-add_link_checker',\r
+'zealbot',\r
+'zemanta',\r
+'zend_http_client',\r
+'zeus',\r
+'zhuaxia',\r
+'[^a]fish',\r
+'[\x20]netseer[\x20]',\r
+'^[1-3]$',\r
+'^finbot',\r
+'^motorola$',\r
+'^msie',\r
+'^voyager/',\r
+'^webindex$',\r
+'1\-more_scanner'\r
+);\r
+\r
+# Generic catch-all patterns: Perl regular expressions (none contains literal\r
+# whitespace) that identify a robot only by a generic keyword in its user agent.\r
+# NOTE(review): presumably consulted after the more specific lists - confirm\r
+# against the code that assembles the RobotsSearchIDOrder lists.\r
+@RobotsSearchIDOrder_listgen = (\r
+# Generic robot\r
+'robot',\r
+'blog',\r
+'checker',\r
+'crawl',\r
+'discover',\r
+'feed',\r
+'fetcher',\r
+'hunter',\r
+'link',\r
+'scanner',\r
+'seek',\r
+'sitemap',\r
+'spider',\r
+'sucker',\r
+'validator',\r
+# "bot" immediately followed by a separator: whitespace _ + : , . ; / \ or -\r
+'bot[\s_+:,\.\;\/\\\-]',\r
+# "bot" immediately preceded by one of the same separators\r
+'[\s_+:,\.\;\/\\\-]bot',\r
+'curl',\r
+'php',\r
+'ruby/',\r
+# NOTE(review): looks like a placeholder id rather than a real user agent substring - confirm\r
+'no_user_agent'\r
+);\r
+\r
+\r
+# RobotsHashIDLib\r
+# List of robot names, as ('robot id','robot clear text') pairs\r
+#-------------------------------------------------------\r
+%RobotsHashIDLib   = (\r
+# Common robots (In robot file)\r
+'bingbot/','bingbot',\r
+'bingpreview','BingPreview',\r
+'MSIECrawler','MSIECrawler',\r
+'msnbot/','msnbot',\r
+'msnbot\-media/','msnbot-media',\r
+'AdIdxBot/','AdIdxBot Microsoft Ad Quality control',\r
+'NOT[\x20]Googlebot/','NOT Googlebot',\r
+'Googlebot/','Googlebot',\r
+'Google[\x20]Web[\x20]Preview','Google Web Preview',\r
+'Googlebot\-Image/','Googlebot-Image',\r
+'Googlebot\-Mobile/','Googlebot-Mobile',\r
+'google\-sitemaps','google-sitemaps',\r
+'Googlebot\-News','Googlebot-News',\r
+'Googlebot\-Video/','Googlebot-Video',\r
+'AdsBot\-Google[\x20]\(','AdsBot-Google',\r
+'AdsBot\-Google\-Mobile\-Apps','AdsBot-Google-Mobile-Apps',\r
+'Mediapartners\-Google','Mediapartners-Google',\r
+'Feedfetcher\-Google','Feedfetcher-Google',\r
+'Google\-Adwords\-Instant','Google-Adwords-Instant',\r
+'Firefox/1\.5','Nautic Expo using Firefox/1.5',\r
+'Yahoo![\x20]Slurp[\x20]China','Yahoo! Slurp China',\r
+'Yahoo![\x20]Slurp','Yahoo! Slurp',\r
+'Baiduspider/','Baiduspider',\r
+'Baiduspider\-image','Baiduspider-image',\r
+'baidu','Baidu ( catchall )',\r
+'YandexBot/','YandexBot',\r
+'YandexImages/','YandexImages',\r
+'YandexMetrika/','YandexMetrika',\r
+'YandexMobileBot/','YandexMobileBot',\r
+'yandex','Yandex ( catchall )',\r
+'electricmonk/','electricmonk',\r
+'spbot/','spbot',\r
+'SeznamBot/','SeznamBot',\r
+'msie8','msie8 - ( Rogue Robot )',\r
+'AhrefsBot/','AhrefsBot',\r
+'007ac9[\x20]Crawler','007ac9 Crawler',\r
+'2345Explorer/','2345Explorer',\r
+'360Spider','360Spider',\r
+'A[\x20]Simple[\x20]Crawler','A Simple Crawler',\r
+'Abrave','Abrave',\r
+'acapbot/','acapbot',\r
+'Accoona\-AI\-Agent/','Accoona-AI-Agent',\r
+'AdnormCrawlerCatchBot/','AdnormCrawlerCatchBot',\r
+'aiHitBot/','aiHitBot',\r
+'aipbot/','aipbot',\r
+'Apache\-HttpClient/','Apache-HttpClient',\r
+'Apexoo[\x20]Spider','Apexoo Spider',\r
+'Applebot/','Applebot',\r
+'archive\.org_bot','archive.org_bot',\r
+'Babya[\x20]Discoverer','Babya Discoverer',\r
+'BDCbot/','BDCbot',\r
+'BinGet/','BinGet',\r
+'bl\.uk_lddc_bot/','bl.uk_lddc_bot',\r
+'BLEXBot/','BLEXBot',\r
+'boitho\.com\-dc/','boitho.com-dc',\r
+'BusinessBot:','BusinessBot:',\r
+'CatchBot/','CatchBot',\r
+'CB/Nutch','CB/Nutch',\r
+'CCBot/','CCBot',\r
+'Cliqzbot/','Cliqzbot',\r
+'CMS[\x20]Crawler','CMS Crawler',\r
+'ConveraCrawler/','ConveraCrawler',\r
+'cosmos/','cosmos',\r
+'crawl/Nutch','crawl/Nutch',\r
+'Crawler/','Crawler',\r
+'crawler4j','crawler4j',\r
+'CRAZYWEBCRAWLER','CRAZYWEBCRAWLER',\r
+'CSE[\x20]HTML[\x20]Validator','CSE HTML Validator',\r
+'C\-T[\x20]bot','C-T bot',\r
+'Curl/PHP','Curl/PHP',\r
+'Dalvik/','Dalvik',\r
+'DataCrawler/','DataCrawler',\r
+'Deepnet[\x20]Explorer','Deepnet Explorer',\r
+'DeuSu/','DeuSu',\r
+'Digincore','Digincore',\r
+'Discordbot/','Discordbot',\r
+'DoCoMo/','DoCoMo',\r
+'Domain[\x20]Re\-Animator[\x20]Bot','Domain Re-Animator Bot',\r
+'DomainCrawler/','DomainCrawler',\r
+'DomainMacroCrawler/','DomainMacroCrawler',\r
+'DomainSONOCrawler/','DomainSONOCrawler',\r
+'DomainStatsBot/','DomainStatsBot',\r
+'DotBot/','DotBot',\r
+'DuckDuckGo\-Favicons\-Bot/','DuckDuckGo-Favicons-Bot',\r
+'ELinks/','ELinks',\r
+'ELinks[\x20]\(','ELinks (',\r
+'EmailMarketingRobot/','EmailMarketingRobot',\r
+'EmeraldShield\.com[\x20]WebBot','EmeraldShield.com WebBot',\r
+'envolk\[ITS\]spider/','envolk ITS spider',\r
+'EsperanzaBot','EsperanzaBot',\r
+'Exabot/','Exabot',\r
+'facebookexternalhit/','facebookexternalhit',\r
+'fast_enterprise_crawler.*scrawleradmin\.t\-info@telekom\.de','FAST Enterprise crawleradmin.t-info@telekom.de',\r
+'fast_enterprise_crawler.*t\-info_bi_cluster_crawleradmin\.t\-info@telekom\.de','FAST Enterprise T-Info_BI_cluster crawleradmin.t-info@telekom.de',\r
+'FAST\-WebCrawler/','FAST-WebCrawler',\r
+'Feosey[\x20]Mohk[\x20]Crawler','Feosey Mohk Crawler',\r
+'findlinks/','findlinks',\r
+'Findxbot/','Findxbot',\r
+'FirePHP/','FirePHP',\r
+'FlippyBearBot/','FlippyBearBot',\r
+'FreeWebMonitoring[\x20]SiteChecker/','FreeWebMonitoring SiteChecker',\r
+'fujilabol','fujilabol',\r
+'FurlBot/','FurlBot',\r
+'Gaisbot/','Gaisbot',\r
+'Gallent[\x20]Spider','Gallent Spider',\r
+'GarlikCrawler/','GarlikCrawler',\r
+'GetintentCrawler[\x20]getintent\.com','GetintentCrawler getintent.com',\r
+'Gigabot/','Gigabot',\r
+'gipo\-crawler/Nutch','gipo-crawler/Nutch',\r
+'Girafabot','Girafabot',\r
+'Gluten[\x20]Free[\x20]Crawler/','Gluten Free Crawler',\r
+'gocrawl','gocrawl',\r
+'GrapeshotCrawler/','GrapeshotCrawler',\r
+'GSiteCrawler/','GSiteCrawler',\r
+'GurujiBot/','GurujiBot',\r
+'HaosouSpider','HaosouSpider',\r
+'holmes/','holmes',\r
+'HTTP_Request2/','HTTP_Request2',\r
+'HubSpot[\x20]Webcrawler','HubSpot Webcrawler',\r
+'HyperCrawl/','HyperCrawl',\r
+'ICC\-Crawler/','ICC-Crawler',\r
+'iconoclast','iconoclast',\r
+'IDGCrawler/Nutch','IDGCrawler/Nutch',\r
+'idmarch[\x20]Automatic\.beta/','idmarch Automatic.beta',\r
+'Incutio[\x20]XML','Incutio XML',\r
+'InfluenceBot','InfluenceBot',\r
+'IRLbot/','IRLbot',\r
+'IssueCrawler','IssueCrawler',\r
+'istellabot/','istellabot',\r
+'James[\x20]BOT','James BOT',\r
+'Jigsaw/','Jigsaw',\r
+'JobFeed','JobFeed',\r
+'KomodiaBot/','KomodiaBot',\r
+'Konqueror/','Konqueror',\r
+'linkapediabot','linkapediabot',\r
+'metager\-linkchecker','metager-linkchecker',\r
+'linkchecker','linkchecker',\r
+'LinkCheck','LinkCheck',\r
+'linkdexbot/','linkdexbot',\r
+'LinkedInBot/','LinkedInBot',\r
+'LinkpadBot/','LinkpadBot',\r
+'Links[\x20]\(','Links (',\r
+'LinksManager\.com_bot','LinksManager.com_bot',\r
+'LWP::Simple/','LWP::Simple',\r
+'Mail\.RU_Bot/','Mail.RU Bot',\r
+'meanpathbot/','meanpathbot',\r
+'Mediatoolkitbot','Mediatoolkitbot',\r
+'MegaIndex\.ru/','MegaIndex.ru',\r
+'merzscope','merzscope',\r
+'mfibot/','mfibot',\r
+'microsoft.*discovery','Microsoft Office Protocol Discovery',\r
+'missigua_locator','missigua_locator',\r
+'MixrankBot','MixrankBot',\r
+'MJ12bot/','MJ12bot',\r
+'MojeekBot/','MojeekBot',\r
+'Mojolicious','Mojolicious',\r
+'MXT/Nutch','MXT/Nutch',\r
+'My[\x20]Nutch[\x20]Spider/','My Nutch Spider',\r
+'myse/Nutch','myse/Nutch',\r
+'NerdyBot','NerdyBot',\r
+'netEstate[\x20]NE[\x20]Crawler','netEstate NE Crawler',\r
+'NetResearchServer/','NetResearchServer',\r
+'NRLCorpusBuilder/Nutch','NRLCorpusBuilder/Nutch',\r
+'nutch\-1\.4/','nutch-1.4',\r
+'nutch\-1\.8/','nutch-1.8',\r
+'NutchCVS/','NutchCVS',\r
+'o\.uk[\x20]robot','o uk.robot',\r
+'oBot/','oBot',\r
+'ocrawler;','ocrawler;',\r
+'ODP[\x20]link[\x20]checker','ODP link checker',\r
+'Offline[\x20]Explorer/','Offline Explorer',\r
+'OmniExplorer_Bot/','OmniExplorer_Bot',\r
+'OrangeBot/','OrangeBot',\r
+'PageBitesHyperBot/','PageBitesHyperBot',\r
+'pdffillerbot/','pdffillerbot',\r
+'PhantomJS','PhantomJS',\r
+'PHP/5\.2\.8','PHP/5.2.8',\r
+'Ploetz[\x20]\+[\x20]Zeller','Ploetz + Zeller',\r
+'Plukkie/','Plukkie',\r
+'Princetonbot/','Princetonbot',\r
+'PrivacyAwareBot/','PrivacyAwareBot',\r
+'proximic','proximic',\r
+'psbot/','psbot',\r
+'psbot\-image','psbot-image',\r
+'python_wk_crawler','python_wk_crawler',\r
+'Python\-urllib/','Python-urllib',\r
+'QCrawl','QCrawl',\r
+'ResearchBot','ResearchBot',\r
+'roboto','roboto',\r
+'rogerbot/','rogerbot',\r
+'RSSingBot','RSSingBot',\r
+'RukiCrawler/','RukiCrawler',\r
+'SafeDNS[\x20]search[\x20]bot/','SafeDNS search bot',\r
+'SafeDNSBot','SafeDNSBot',\r
+'SafeSearch[\x20]microdata[\x20]crawler','SafeSearch microdata crawler',\r
+'safesearch','safesearch ( catchall )',\r
+'SBL\-BOT','SBL-BOT',\r
+'Screaming[\x20]Frog[\x20]SEO[\x20]Spider/','Screaming Frog SEO Spider',\r
+'ScreenerBot[\x20]Crawler[\x20]Beta','ScreenerBot Crawler Beta',\r
+'Searchie/','Searchie',\r
+'Seekmo','Seekmo',\r
+'semanticbot','semanticbot',\r
+'SemrushBot/','SemrushBot',\r
+'seo\-audit\-check\-bot/','seo-audit-check-bot',\r
+'Seobility','Seobility',\r
+'SEOkicks\-Robot','SEOkicks-Robot',\r
+'SEOlyticsCrawler/','SEOlyticsCrawler',\r
+'SEOstats','SEOstats',\r
+'Seosys/Nutch','Seosys/Nutch',\r
+'Seoterritory\.com[\x20]bot','Seoterritory.com.bot',\r
+'Shim\-Crawler','Shim-Crawler',\r
+'SiteExplorer/','SiteExplorer',\r
+'siteexplorer\.info','siteexplorer.info',\r
+'Slackbot\-LinkExpanding','Slackbot-LinkExpanding',\r
+'SmabblerBot/','SmabblerBot',\r
+'Sogou[\x20]web[\x20]spider/','Sogou web spider',\r
+'special_archiver/','special_archiver',\r
+'Spiderbot/','Spiderbot',\r
+'ssearch_bot','ssearch_bot',\r
+'SurdotlyBot/','SurdotlyBot',\r
+'SurveyBot/','SurveyBot',\r
+'taiil/Nutch','taiil/Nutch',\r
+'tbot\-nutch','tbot-nutch',\r
+'TeeRaidBot','TeeRaidBot',\r
+'TelegramBot','TelegramBot',\r
+'Test/Nutch','Test/Nutch',\r
+'Test[\x20]Spider','Test Spider',\r
+'TestCrawler','TestCrawler',\r
+'TurnitinBot/','TurnitinBot',\r
+'TurnitinBot','TurnitinBot',\r
+'TweetmemeBot/','TweetmemeBot',\r
+'UCY/Nutch','UCY/Nutch',\r
+'Uptimebot/','Uptimebot',\r
+'URL[\x20]Checker','URL Checker',\r
+'UXCrawlerBot','UXCrawlerBot',\r
+'Validator\.nu/','Validator.nu',\r
+'vBSEO','vBSEO',\r
+'vBulletin[\x20]via[\x20]PHP','vBulletin via PHP',\r
+'vebidoobot','vebidoobot',\r
+'viz/Nutch','viz/Nutch',\r
+'VoilaBot','VoilaBot',\r
+'VORTEX/','VORTEX',\r
+'voyager/','voyager',\r
+'W3C_Validator/','W3C_Validator',\r
+'W3C\-checklink/','W3C-checklink',\r
+'WBSearchBot/','WBSearchBot',\r
+'WeSEE:Ads/PageBot','WeSEE:Ads/PageBot',\r
+'WeSEE:Ads/PictureBot','WeSEE:Ads/PictureBot',\r
+'WeSEE_Bot','WeSEE_Bot',\r
+'Wget/','Wget',\r
+'Who\.is[\x20]Bot','Who.is.Bot',\r
+'wonderbot/','wonderbot',\r
+'woobot/','woobot',\r
+'Wotbox/','Wotbox',\r
+'Xaldon[\x20]WebSpider','Xaldon WebSpider',\r
+'Xenu[\x20]Link[\x20]Sleuth','Xenu Link Sleuth',\r
+'xenu_link_sleuth','xenu_link_sleuth',\r
+'XML[\x20]Sitemaps[\x20]Generator','XML Sitemaps Generator',\r
+'XoviBot/','XoviBot',\r
+'yacybot','yacybot',\r
+'Yahoo[\x20]Link[\x20]Preview','Yahoo Link Preview',\r
+'YisouSpider','YisouSpider',\r
+'yoozBot','yoozBot',\r
+'zspider/','zspider',\r
+'ZumBot/','ZumBot',\r
+# below placed at end to catch some generics\r
+'nbot','nbot',\r
+'ng/1\.','ng/1.',\r
+'ng/2\.','ng/2.',\r
+'libwww\-perl','libwww-perl',\r
+'CFNetwork','CFNetwork',\r
+'urllib','urllib',\r
+'javabee','javabee',\r
+'projectwf\-java\-test\-crawler','projectwf-java-test-crawler',\r
+'java','Java ( catchall )',\r
+'loocalcrawler/nutch','loocalcrawler/nutch',\r
+'nutchosu\-vlib','nutchosu-vlib',\r
+'nutch','nutch ( catchall )',\r
+'perlcrawler','perlcrawler',\r
+'perl','perl',\r
+'(firefox/)([0-9]\.|[0-1][0]\.)','Firefox version 10 and lower - various robots',\r
+\r
+# Less common robots (In robot file)\r
+'^Mozilla$','Mozilla ( Rogue Robot )',\r
+'^mozilla\/3\.0\s\(compatible$', 'mozilla/3.0 (compatible - ( Rogue Robot )',\r
+'^mozilla\/4\.0$', 'mozilla/4.0 - ( Rogue Robot )',\r
+'^mozilla\/4\.0\s\(compatible;\)$', 'mozilla/4.0 (compatible;) - ( Rogue Robot )',\r
+'^mozilla\/5\.0$', 'mozilla/5.0 - ( Rogue Robot )',\r
+'^mozilla\/5\.0\s\(compatible;$', 'mozilla/5.0 (compatible; - ( Rogue Robot )',\r
+'^mozilla\/5\.0\s\(en\-us\)$', 'mozilla/5.0 (en-us) - ( Rogue Robot )',\r
+'^mozilla\/5\.0\sfirefox\/3\.0\.5$', 'mozilla/5.0 firefox/3.0.5 - ( Rogue Robot )',\r
+'^Mozilla/6\.0[\x20]\(compatible\)$','Mozilla/6.0 (compatible) - ( Rogue Robot )',\r
+'^Mozilla/(.*)Beta[\x20]\(Windows\)','Mozilla Beta (Windows) - ( Rogue Robot )',\r
+'MSIE[\x20]2','MSIE 2 - ( Rogue Robot )',\r
+'MSIE[\x20]3','MSIE 3 - ( Rogue Robot )',\r
+'MSIE[\x20]4','MSIE 4 - ( Rogue Robot )',\r
+'MSIE[\x20]5','MSIE 5 - ( Rogue Robot )',\r
+'MSIE[\x20]6','MSIE 6 - ( Rogue Robot )',\r
+'Windows[\x20]95','Windows 95 - ( Rogue Robot )',\r
+'Windows[\x20]98','Windows 99 - ( Rogue Robot )',\r
+\r
+# these could be removed to speed up processing as they are rarely seen\r
+'a6\-indexer','a6-indexer',\r
+'abcdatos','abcdatos',\r
+'abonti\.com','abonti.com',\r
+'acme\.spider','acme.spider',\r
+'activebookmark','activebookmark',\r
+'adamm_bot','adamm_bot',\r
+'advbot','advbot',\r
+'affectv\.co\.uk','affectv.co.uk',\r
+'ahoythehomepagefinder','ahoythehomepagefinder',\r
+'aleadsoftbot','aleadsoftbot',\r
+'alkaline','alkaline',\r
+'allrati','allrati',\r
+'alltop','alltop',\r
+'almaden','almaden',\r
+'alpha_search_agent','alpha_search_agent',\r
+'anthill','anthill',\r
+'antibot','antibot',\r
+'aport','aport',\r
+'appie','appie',\r
+'applesyndication','applesyndication',\r
+'arachnophilia','arachnophilia',\r
+'arale','arale',\r
+'araneo','araneo',\r
+'architext','architext',\r
+'archive\-de\.com','archive-de.com',\r
+'aretha','aretha',\r
+'argus','argus',\r
+'ariadne','ariadne',\r
+'arianna\.libero\.it','arianna.libero.it',\r
+'arks','arks',\r
+'aspider','aspider',\r
+'aspseek','aspseek',\r
+'asterias','asterias',\r
+'asynchttpclient','asynchttpclient',\r
+'atn\.txt','atn.txt',\r
+'atomz','atomz',\r
+'auresys','auresys',\r
+'awbot','awbot',\r
+'backlinktest\.com','backlinktest.com',\r
+'backrub','backrub',\r
+'bbot','bbot',\r
+'becomebot','becomebot',\r
+'bender','bender',\r
+'betabot','betabot',\r
+'bigbrother','bigbrother',\r
+'biglotron','biglotron',\r
+'BingLocalSearch','BingLocalSearch',\r
+'bittorrent_bot','bittorrent_bot',\r
+'biz360[_+\s]spider','biz360 spider',\r
+'bjaaland','bjaaland',\r
+'blackwidow','blackwidow',\r
+'blindekuh','blindekuh',\r
+'blogbridge[_+\s]service','blogbridge service',\r
+'blogged_crawl','blogged_crawl',\r
+'bloglines','bloglines',\r
+'bloglovin','bloglovin',\r
+'blogpulse','blogpulse',\r
+'blogsearch','blogsearch',\r
+'blogshares','blogshares',\r
+'blogslive','blogslive',\r
+'blogssay','blogssay',\r
+'bloodhound','bloodhound',\r
+'bncf\.firenze\.sbn\.it/raccolta\.txt','bncf\.firenze\.sbn.it/raccolta.txt',\r
+'bobby','bobby',\r
+'bookmark\-manager','bookmark-manager',\r
+'borg\-bot','borg-bot',\r
+'boris','boris',\r
+'brightnet','brightnet',\r
+'bruinbot','bruinbot',\r
+'bspider','bspider',\r
+'bubing','bubing',\r
+'bumblebee','bumblebee',\r
+'butterfly','butterfly',\r
+'buzztracker','buzztracker',\r
+'cactvschemistryspider','cactvschemistryspider',\r
+'calif[^r]','calif[^r]',\r
+'candlelight[_+\s]favorites[_+\s]inspector','candlelight favorites inspector',\r
+'careerbot','careerbot',\r
+'carpathia','carpathia',\r
+'cassandra','cassandra',\r
+'catbot','catbot',\r
+'cbn00glebot','cbn00glebot',\r
+'cerberian_drtrs','cerberian_drtrs',\r
+'cfetch','cfetch',\r
+'cgireader','cgireader',\r
+'chattertrap','chattertrap',\r
+'check_http','check_http',\r
+'checkbot','checkbot',\r
+'checkweb_link_validator','checkweb_link_validator',\r
+'christcrawler','christcrawler',\r
+'churl','churl',\r
+'cienciaficcion','cienciaficcion',\r
+'cipinetbot','cipinetbot',\r
+'imagecoccoc','imagecoccoc',\r
+'coccoc','coccoc',\r
+'coldfusion','coldfusion',\r
+'collective','collective',\r
+'combine','combine',\r
+'commons\-httpclient','commons-httpclient',\r
+'computer_and_automation_research_institute_crawler','computer_and_automation_research_institute_crawler',\r
+'conceptbot','conceptbot',\r
+'contentmatch','contentmatch',\r
+'converamultimediacrawler','converamultimediacrawler',\r
+'coolbot','coolbot',\r
+'copubbot','copubbot',\r
+'core','core',\r
+'covario','covario',\r
+'cruiser','cruiser',\r
+'cscrawler','cscrawler',\r
+'cuasarbot','cuasarbot',\r
+'cursor','cursor',\r
+'cusco','cusco',\r
+'custo','custo',\r
+'cyberspyder','cyberspyder',\r
+'datafountains/dmoz_downloader','datafountains/dmoz_downloader',\r
+'dataprovider\.com','dataprovider.com',\r
+'daumoa','daumoa',\r
+'daviesbot','daviesbot',\r
+'daylifefeedfetcher','daylifefeedfetcher',\r
+'daypopbot','daypopbot',\r
+'deepindex','deepindex',\r
+'desertrealm','desertrealm',\r
+'deweb','deweb',\r
+'dienstspider','dienstspider',\r
+'digger','digger',\r
+'digout4u','digout4u',\r
+'diibot','diibot',\r
+'dipsie\.bot','dipsie.bot',\r
+'direct_hit','direct_hit',\r
+'discobot','discobot',\r
+'dlvr\.it','dlvr.it',\r
+'dnabot','dnabot',\r
+'dnsgroup','dnsgroup',\r
+'doccheckbot','doccheckbot',\r
+'domainappender','domainappender',\r
+'domainchecker','domainchecker',\r
+'domainsdb\.net','domainsdb.net',\r
+'download_express','download_express',\r
+'dragonbot','dragonbot',\r
+'dreamwidth','dreamwidth',\r
+'drupal','drupal',\r
+'dulance','dulance',\r
+'dumbot','dumbot',\r
+'dumm\.de\-bot','dumm.de-bot',\r
+'dwcp','dwcp',\r
+'e\-collector','e-collector',\r
+'earthcom\.info','earthcom.info',\r
+'easydl','easydl',\r
+'ebiness','ebiness',\r
+'eccp','eccp',\r
+'echo!','echo!',\r
+'edgeio\-retriever','edgeio-retriever',\r
+'elfinbot','elfinbot',\r
+'emacs','emacs',\r
+'emcspider','emcspider',\r
+'enteprise','enteprise',\r
+'ernst[:blank:]2\.0','ernst[:blank:]2.0',\r
+'esther','esther',\r
+'ets_v','ets_v',\r
+'eventax','eventax',\r
+'everbeecrawler','everbeecrawler',\r
+'everest\-vulcan','everest-vulcan',\r
+'evliyacelebi','evliyacelebi',\r
+'exactseek','exactseek',\r
+'extreme[_+\s]picture[_+\s]finder','extreme picture finder',\r
+'ezoom','ezoom',\r
+'ezresult','ezresult',\r
+'facebook','facebook',\r
+'facebot','facebot',\r
+'fast\-search\-engine','fast-search-engine',\r
+'matrix_s\.p\.a\._\-_fast_enterprise_crawler','matrix_s.p.a._-_fast_enterprise_crawler',\r
+'fast_enterprise_crawler','fast_enterprise_crawler',\r
+'fastbot','fastbot',\r
+'fastcrawler','fastcrawler',\r
+'favicon','favicon',\r
+'favorg','favorg',\r
+'favorites_sweeper','favorites_sweeper',\r
+'fdse','fdse',\r
+'feedburner','feedburner',\r
+'feedcrawl','feedcrawl',\r
+'feedflow','feedflow',\r
+'feedmyinbox','feedmyinbox',\r
+'feedroll\.com','feedroll.com',\r
+'feedsky','feedsky',\r
+'feedster','feedster',\r
+'feedvalidator','feedvalidator',\r
+'feedzira','feedzira',\r
+'felix','felix',\r
+'ferret','ferret',\r
+'fetchbot','fetchbot',\r
+'fetchrover','fetchrover',\r
+'fever/','fever',\r
+'fido','fido',\r
+'filmkamerabot','filmkamerabot',\r
+'filterdb\.iss\.net','filterdb.iss.net',\r
+'finderlein[_+\s]research[_+\s]crawler','finderlein research crawler',\r
+'findexa_crawler','findexa_crawler',\r
+'finnish','finnish',\r
+'fireball','fireball',\r
+'firmilybot','firmilybot',\r
+'flexum','flexum',\r
+'foaf\-search\.net','foaf-search.net',\r
+'fooky\.com/ScorpionBot','fooky.com/ScorpionBot',\r
+'fouineur','fouineur',\r
+'francoroute','francoroute',\r
+'freecrawl','freecrawl',\r
+'freenews','freenews',\r
+'funnelweb','funnelweb',\r
+'g2crawler','g2crawler',\r
+'gama','gama',\r
+'gazz','gazz',\r
+'gcreep','gcreep',\r
+'geniebot','geniebot',\r
+'genieo','genieo',\r
+'geohasher','geohasher',\r
+'getbot','getbot',\r
+'geturl','geturl',\r
+'gigablastopensource','gigablastopensource',\r
+'global_fetch','global_fetch',\r
+'gnodspider','gnodspider',\r
+'goforit\.com','goforit.com',\r
+'goforitbot','goforitbot',\r
+'golem','golem',\r
+'gonzo','gonzo',\r
+'gougou','gougou',\r
+'gpu_p2p_crawler','gpu_p2p_crawler',\r
+'grabber','grabber',\r
+'grapeshot','grapeshot',\r
+'grapnel','grapnel',\r
+'griffon','griffon',\r
+'gromit','gromit',\r
+'grub','grub',\r
+'gulliver','gulliver',\r
+'gulperbot','gulperbot',\r
+'hambot','hambot',\r
+'hanrss','hanrss',\r
+'harvest','harvest',\r
+'havindex','havindex',\r
+'henrythemiragorobot','henrythemiragorobot',\r
+'heritrix','heritrix',\r
+'hl_ftien_spider','hl_ftien_spider',\r
+'hometown','hometown',\r
+'hoowwwer','hoowwwer',\r
+'hpprint','hpprint',\r
+'htdig','htdig',\r
+'html[_+\s]link[_+\s]validator','html link validator',\r
+'htmlgobble','htmlgobble',\r
+'htmlparser','htmlparser',\r
+'httrack','httrack',\r
+'hundesuche\.com\-bot','hundesuche.com-bot',\r
+'hyperdecontextualizer','hyperdecontextualizer',\r
+'ia_archiver\-web\.archive\.org','ia_archiver-web.archive.org',\r
+'ia_archiver','ia_archiver',\r
+'iajabot','iajabot',\r
+'iaskspider','iaskspider',\r
+'i\-bot','i-bot',\r
+'icarus6j','icarus6j',\r
+'ichiro','ichiro',\r
+'icjobs\.de','icjobs.de',\r
+'ilse','ilse',\r
+'iltrovatore\-setaccio','iltrovatore-setaccio',\r
+'imagelock','imagelock',\r
+'implisensebot','implisensebot',\r
+'inagist','inagist',\r
+'incywincy','incywincy',\r
+'infobot','infobot',\r
+'infociousbot','infociousbot',\r
+'infohelfer','infohelfer',\r
+'infomine','infomine',\r
+'informant','informant',\r
+'infoseeksidewinder','infoseeksidewinder',\r
+'infoseek','infoseek',\r
+'infospider','infospider',\r
+'inspectorwww','inspectorwww',\r
+'insurancobot','insurancobot',\r
+'integromedb\.org','integromedb.org',\r
+'intelliagent','intelliagent',\r
+'internet[_+\s]ninja','internet ninja',\r
+'internetarchive','internetarchive',\r
+'internetseer','internetseer',\r
+'internetsupervision','internetsupervision',\r
+'ips\-agent','ips-agent',\r
+'irobot','irobot',\r
+'iron33','iron33',\r
+'isearch2006','isearch2006',\r
+'israelisearch','israelisearch',\r
+'iupui_research_bot','iupui_research_bot',\r
+'izsearch','izsearch',\r
+'jacobin[\x20]club','jacobin club',\r
+'jakarta','jakarta',\r
+'jbot','jbot',\r
+'jcrawler','jcrawler',\r
+'jeeves','jeeves',\r
+'jennybot','jennybot',\r
+'jobboerse','jobboerse',\r
+'jobot','jobot',\r
+'jobo','jobo',\r
+'joebot','joebot',\r
+'jrtwine[_+\s]software[_+\s]check[_+\s]favorites[_+\s]utility','jrtwine software check favorites utility',\r
+'js\-kit','js-kit',\r
+'jubii','jubii',\r
+'jumpstation','jumpstation',\r
+'justview','justview',\r
+'kalambot','kalambot',\r
+'kamano\.de_newsfeedverzeichnis','kamano.de_newsfeedverzeichnis',\r
+'kapsi','kapsi',\r
+'katipo','katipo',\r
+'kazoombot','kazoombot',\r
+'kevin','kevin',\r
+'keyoshid','keyoshid',\r
+'kilroy','kilroy',\r
+'kinja\-imagebot','kinja-imagebot',\r
+'kinjabot','kinjabot',\r
+'knowitall','knowitall',\r
+'knowledge\.com','knowledge.com',\r
+'ko[_+\s]yappo[_+\s]robot','ko yappo robot',\r
+'kouaa_krawler','kouaa_krawler',\r
+'krugle','krugle',\r
+'ksibot','ksibot',\r
+'kummhttp','kummhttp',\r
+'kurzor','kurzor',\r
+'labelgrabber\.txt','labelgrabber.txt',\r
+'lanshanbot','lanshanbot',\r
+'larbin','larbin',\r
+'largesmall[\x20]crawler','largesmall crawler',\r
+'legs','legs',\r
+'letscrawl\.com','letscrawl.com',\r
+'libcrawl','libcrawl',\r
+'lilina','lilina',\r
+'link_valet_online','link_valet_online',\r
+'linkbot','linkbot',\r
+'linkdex\.com','linkdex.com',\r
+'linkidator','linkidator',\r
+'linkscan','linkscan',\r
+'linkstats[\x20]bot','linkstats bot',\r
+'linkwalker','linkwalker',\r
+'lipperhey','lipperhey',\r
+'livejournal\.com','livejournal.com',\r
+'lmspider','lmspider',\r
+'loadtimebot','loadtimebot',\r
+'lockon','lockon',\r
+'logo_gif','logo_gif',\r
+'longurl','longurl',\r
+'lssrocketcrawler','lssrocketcrawler',\r
+'ltbot','ltbot',\r
+'ltx71','ltx71',\r
+'lwp\-request','lwp-request',\r
+'lwp\-trivial','lwp-trivial',\r
+'lycos[_+\s]','lycos ',\r
+'macworm','macworm',\r
+'madaali\.de','madaali.de',\r
+'magpierss','magpierss',\r
+'magpie','magpie',\r
+'mapoftheinternet\.com','mapoftheinternet.com',\r
+'marvin','marvin',\r
+'mattie','mattie',\r
+'mediabot','mediabot',\r
+'mediafox','mediafox',\r
+'megaindex','megaindex',\r
+'megite','megite',\r
+'memorybot','memorybot',\r
+'mercator','mercator',\r
+'meshexplorer','meshexplorer',\r
+'metager2\-verification\-bot','metager2-verification-bot',\r
+'metajobbot','metajobbot',\r
+'metaspinner','metaspinner',\r
+'metauri','metauri',\r
+'miadev','miadev',\r
+'microsoft[_+\s]url[_+\s]control','microsoft url control',\r
+'microsoft[\x20]bits','microsoft bits',\r
+'microsoft\-webdav\-miniredir','microsoft-webdav-miniredir',\r
+'mindcrawler','mindcrawler',\r
+'mindupbot','mindupbot',\r
+'mini\-reptile','mini-reptile',\r
+'minirank','minirank',\r
+'misterbot','misterbot',\r
+'miva','miva',\r
+'mizzu_labs','mizzu_labs',\r
+'mnogosearch','mnogosearch',\r
+'moget','moget',\r
+'momspider','momspider',\r
+'monster','monster',\r
+'motor','motor',\r
+'movabletype','movabletype',\r
+'ms[_+\s]search[_+\s]6\.0[_+\s]robot','ms search 6.0 robot',\r
+'ms_search_4\.0_robot','ms_search_4.0_robot',\r
+'msnbot\-udiscovery','msnbot-udiscovery',\r
+'msrabot','msrabot',\r
+'msrbot','msrbot',\r
+'mt::telegraph::agent','mt::telegraph::agent',\r
+'muncher','muncher',\r
+'muscatferret','muscatferret',\r
+'mwdsearch','mwdsearch',\r
+'mydoyouhike','mydoyouhike',\r
+'myweb','myweb',\r
+'nagios','nagios',\r
+'nasa_search','nasa_search',\r
+'ndspider','ndspider',\r
+'nederland\.zoek','nederland.zoek',\r
+'netcarta','netcarta',\r
+'netcraft','netcraft',\r
+'netluchs','netluchs',\r
+'netmechanic','netmechanic',\r
+'netnewswire','netnewswire',\r
+'netscoop','netscoop',\r
+'netsprint','netsprint',\r
+'netvibes','netvibes',\r
+'newrelicpinger','newrelicpinger',\r
+'newscan\-online','newscan-online',\r
+'newsfox','newsfox',\r
+'newsgatoronline','newsgatoronline',\r
+'nextgensearchbot','nextgensearchbot',\r
+'nhse','nhse',\r
+'nicebot','nicebot',\r
+'nimblecrawler','nimblecrawler',\r
+'ning','ning',\r
+'nomad','nomad',\r
+'northstar','northstar',\r
+'noxtrumbot','noxtrumbot',\r
+'npbot','npbot',\r
+'nzexplorer','nzexplorer',\r
+'objectssearch','objectssearch',\r
+'occam','occam',\r
+'ocelli','ocelli',\r
+'octopus','octopus',\r
+'octora_beta_bot','octora_beta_bot',\r
+'onet\.pl[_+\s]sa','onet.pl sa',\r
+'onfolio','onfolio',\r
+'openfind','openfind',\r
+'opentaggerbot','opentaggerbot',\r
+'openwebspider','openwebspider',\r
+'optimizer','optimizer',\r
+'oracle_ultra_search','oracle_ultra_search',\r
+'orb_search','orb_search',\r
+'orbiter','orbiter',\r
+'packrat','packrat',\r
+'pageboy','pageboy',\r
+'panscient','panscient',\r
+'parasite','parasite',\r
+'passwordmaker\.org','passwordmaker.org',\r
+'patric','patric',\r
+'pear_http_request_class','pear_http_request_class',\r
+'peerbot','peerbot',\r
+'pegasus','pegasus',\r
+'perignator','perignator',\r
+'perman','perman',\r
+'petersnews','petersnews',\r
+'phantom','phantom',\r
+'php[_+\s]version[_+\s]tracker','php version tracker',\r
+'phpcrawl','phpcrawl',\r
+'phpdig','phpdig',\r
+'picmole','picmole',\r
+'pictureofinternet','pictureofinternet',\r
+'piltdownman','piltdownman',\r
+'pimptrain','pimptrain',\r
+'ping\.blo\.gs','ping.blo.gs',\r
+'pingdom','pingdom',\r
+'pioneer','pioneer',\r
+'pita','pita',\r
+'pitkow','pitkow',\r
+'pjspider','pjspider',\r
+'plinki','plinki',\r
+'pluckfeedcrawler','pluckfeedcrawler',\r
+'plumtreewebaccessor','plumtreewebaccessor',\r
+'pogodak','pogodak',\r
+'pompos','pompos',\r
+'popdexter','popdexter',\r
+'poppi','poppi',\r
+'port_huron_labs','port_huron_labs',\r
+'portalb','portalb',\r
+'postfavorites','postfavorites',\r
+'postpost','postpost',\r
+'postrank','postrank',\r
+'powermarks','powermarks',\r
+'printfulbot','printfulbot',\r
+'proodlebot','proodlebot',\r
+'protopage','protopage',\r
+'publiclibraryarchive','publiclibraryarchive',\r
+'pyquery','pyquery',\r
+'python','python',\r
+'qihoobot','qihoobot',\r
+'quipply','quipply',\r
+'qwantify','qwantify',\r
+'r6\_','r6\_',\r
+'rambler','rambler',\r
+'ratingburner','ratingburner',\r
+'raven','raven',\r
+'rbse','rbse',\r
+'redalert','redalert',\r
+'regator','regator',\r
+'relevantnoise\.com','relevantnoise.com',\r
+'resumerobot','resumerobot',\r
+'rhcs','rhcs',\r
+'riddler','riddler',\r
+'road_runner','road_runner',\r
+'robbie','robbie',\r
+'robi','robi',\r
+'robocrawl','robocrawl',\r
+'robofox','robofox',\r
+'robozilla','robozilla',\r
+'rojo','rojo',\r
+'rome[\x20]client','rome client',\r
+'roverbot','roverbot',\r
+'rpt\-httpclient','rpt-httpclient',\r
+'rssgraffiti','rssgraffiti',\r
+'rssimagesbot','rssimagesbot',\r
+'ruffle','ruffle',\r
+'rufusbot','rufusbot',\r
+'rules','rules',\r
+'safeads\.xyz','safeads.xyz',\r
+'safetynetrobot','safetynetrobot',\r
+'sage\+\+','sage++',\r
+'sandcrawler','sandcrawler',\r
+'savetheworldheritage','savetheworldheritage',\r
+'sbider','sbider',\r
+'schizozilla','schizozilla',\r
+'scooter','scooter',\r
+'scoutjet','scoutjet',\r
+'scumbot','scumbot',\r
+'search\-info','search-info',\r
+'search_au','search_au',\r
+'searchguild[_+\s]dmoz[_+\s]experiment','searchguild dmoz experiment',\r
+'searchmetricsbot','searchmetricsbot',\r
+'searchprocess','searchprocess',\r
+'seekbot','seekbot',\r
+'semalt','semalt',\r
+'senrigan','senrigan',\r
+'sensis_web_crawler','sensis_web_crawler',\r
+'seodiver','seodiver',\r
+'seokicks\.de','seokicks.de',\r
+'seoscanners','seoscanners',\r
+'sgscout','sgscout',\r
+'shaggy','shaggy',\r
+'shaihulud','shaihulud',\r
+'shareaholicbot','shareaholicbot',\r
+'shoutcast','shoutcast',\r
+'sift','sift',\r
+'simbot','simbot',\r
+'simplepie','simplepie',\r
+'sistrix','sistrix',\r
+'site\-valet','site-valet',\r
+'sitebot','sitebot',\r
+'sitedomain\-bot','sitedomain-bot',\r
+'sitetech','sitetech',\r
+'skimbot','skimbot',\r
+'skymob','skymob',\r
+'slcrawler','slcrawler',\r
+'slurp','slurp',\r
+'slysearch','slysearch',\r
+'smartspider','smartspider',\r
+'smtbot','smtbot',\r
+'snap\.com_beta_crawler','snap.com_beta_crawler',\r
+'snappy','snappy',\r
+'snooper','snooper',\r
+'sohu\-search','sohu-search',\r
+'sohu','sohu ( catchall )',\r
+'solbot','solbot',\r
+'speedy','speedy',\r
+'sphere_scout','sphere_scout',\r
+'spider[_+\s]monkey','spider monkey',\r
+'spiderline','spiderline',\r
+'spiderlytics','spiderlytics',\r
+'spiderman','spiderman',\r
+'spiderview','spiderview',\r
+'spip','spip',\r
+'sproose_crawler','sproose_crawler',\r
+'spry','spry',\r
+'sqworm','sqworm',\r
+'ssearcher','ssearcher',\r
+'steeler','steeler',\r
+'steroid__download','steroid__download',\r
+'stq_bot','stq_bot',\r
+'Stratagems[\x20]Kumo','Stratagems Kumo',\r
+'suchfin\-bot','suchfin-bot',\r
+'suke','suke',\r
+'summify\.com','summify.com',\r
+'sunrise','sunrise',\r
+'suntek','suntek',\r
+'superbot','superbot',\r
+'superfeedr','superfeedr',\r
+'susie','susie',\r
+'sven','sven',\r
+'syndic8','syndic8',\r
+'syndicapi','syndicapi',\r
+'synoobot','synoobot',\r
+'synthesio','synthesio',\r
+'t\-h\-u\-n\-d\-e\-r\-s\-t\-o\-n\-e','t-h-u-n-d-e-r-s-t-o-n-e',\r
+'tach_bw','tach_bw',\r
+'tagyu_agent','tagyu_agent',\r
+'tailrank','tailrank',\r
+'tarantula','tarantula',\r
+'tarspider','tarspider',\r
+'tcl_http_client_package','tcl_http_client_package',\r
+'techbot','techbot',\r
+'technoratibot','technoratibot',\r
+'templeton','templeton',\r
+'teoma','teoma',\r
+'teragramcrawlersurf','teragramcrawlersurf',\r
+'test_crawler','test_crawler',\r
+'testbot','testbot',\r
+'thumbsniper','thumbsniper',\r
+'titan','titan',\r
+'titin','titin',\r
+'tkwww','tkwww',\r
+'tlspider','tlspider',\r
+'topblogsinfo','topblogsinfo',\r
+'topicblogs','topicblogs',\r
+'topix\.net','topix.net',\r
+'trapit','trapit',\r
+'trileet','trileet',\r
+'turtlescanner','turtlescanner',\r
+'turtle','turtle',\r
+'tutorgigbot','tutorgigbot',\r
+'tweetedtimes','tweetedtimes',\r
+'twiceler','twiceler',\r
+'twisted[\x20]pagegetter','twisted pagegetter',\r
+'twitterbot','twitterbot',\r
+'twitterfeed','twitterfeed',\r
+'ubicrawler','ubicrawler',\r
+'ucsd','ucsd',\r
+'udmsearch','udmsearch',\r
+'ultraseek','ultraseek',\r
+'unchaos_bot_hybrid_web_search_engine','unchaos_bot_hybrid_web_search_engine',\r
+'unido\-bot','unido-bot',\r
+'unisterbot','unisterbot',\r
+'universalfeedparser','universalfeedparser',\r
+'unlost_web_crawler','unlost_web_crawler',\r
+'unwindfetchor','unwindfetchor',\r
+'updated','updated',\r
+'urlck','urlck',\r
+'ustc\-semantic\-group','ustc-semantic-group',\r
+'vagabondo\-wap','vagabondo-wap',\r
+'vagabondo','vagabondo',\r
+'valkyrie','valkyrie',\r
+'vermut','vermut',\r
+'versus_crawler_from_eda\.baykan@epfl\.ch','versus_crawler_from_eda.baykan@epfl.ch',\r
+'verticrawl','verticrawl',\r
+'vespa_crawler','vespa_crawler',\r
+'victoria','victoria',\r
+'virus[_+\s]detector','virus_detector',\r
+'visionsearch','visionsearch',\r
+'voidbot','voidbot',\r
+'voltron','voltron',\r
+'vse/','vse',\r
+'vwbot','vwbot',\r
+'w3c[_+\s]css[_+\s]validator[_+\s]jfouffa','w3c_css_validator_jfouffa',\r
+'w3index','w3index',\r
+'w3m2','w3m2',\r
+'wallpaper','wallpaper',\r
+'wanderer','wanderer',\r
+'wapspider','wapspider',\r
+'wapspIRLider','wapspIRLider',\r
+'watchmouse','watchmouse',\r
+'wavefire','wavefire',\r
+'waybackarchive\.org','waybackarchive.org',\r
+'wazzup','wazzup',\r
+'web_downloader','web_downloader',\r
+'webbandit','webbandit',\r
+'webbase','webbase',\r
+'webcatcher','webcatcher',\r
+'webclipping\.com','webclipping.com',\r
+'webcollage','webcollage',\r
+'webcompass','webcompass',\r
+'webcopy','webcopy',\r
+'webcrawl\.net','webcrawl.net',\r
+'webdup','webdup',\r
+'webfetcher','webfetcher',\r
+'webfilter','webfilter',\r
+'webfoot','webfoot',\r
+'webinator','webinator',\r
+'webindexer','webindexer',\r
+'weblayers','weblayers',\r
+'weblinker','weblinker',\r
+'webminer','webminer',\r
+'webmirror','webmirror',\r
+'webmoose','webmoose',\r
+'webquest','webquest',\r
+'webreader','webreader',\r
+'webreaper','webreaper',\r
+'website[_+\s]monitoring[_+\s]bot','website monitoring bot',\r
+'websnarf','websnarf',\r
+'webspider','webspider',\r
+'webvac','webvac',\r
+'webvulncrawl','webvulncrawl',\r
+'webwalker','webwalker',\r
+'webwalk','webwalk',\r
+'webwatch','webwatch',\r
+'wells_search','wells_search',\r
+'wer\-liefert\-was','wer-liefert-was',\r
+'wesee:search','wesee:search',\r
+'wevikabot','wevikabot',\r
+'whatuseek','whatuseek',\r
+'whowhere','whowhere',\r
+'windows\-rss\-platform','windows-rss-platform',\r
+'wired\-digital','wired-digital',\r
+'zyborg','zyborg',\r
+'wisenutbot','wisenutbot',\r
+'wiumi','wiumi',\r
+'wmir','wmir',\r
+'wolp','wolp',\r
+'wombat','wombat',\r
+'wonderer','wonderer',\r
+'woozweb','woozweb',\r
+'wordpress','wordpress',\r
+'worm','worm',\r
+'wume_crawler','wume_crawler',\r
+'wwwc','wwwc',\r
+'wwweasel','wwweasel',\r
+'wz101','wz101',\r
+'xget','xget',\r
+'xirq','xirq',\r
+'xydo','xydo',\r
+'y!j','y!j',\r
+'yahoo![\x20]searchmonkey','yahoo! searchmonkey',\r
+'yahoo!_mindset','yahoo!_mindset',\r
+'yahoo\-blogs','yahoo-blogs',\r
+'yahoo\-mmcrawler','yahoo-mmcrawler',\r
+'yahoo\-newscrawler','yahoo-newscrawler',\r
+'yahoo[\x20]pipes','yahoo pipes',\r
+'yahoo\-verticalcrawler','yahoo-verticalcrawler',\r
+'yahoocachesystem','yahoocachesystem',\r
+'yahooexternalcache','yahooexternalcache',\r
+'yahoofeedseeker','yahoofeedseeker',\r
+'yahooseeker\-testing','yahooseeker-testing',\r
+'yahooseeker','yahooseeker',\r
+'yahooysmcm','yahooysmcm',\r
+'yammer','yammer',\r
+'yanga','yanga',\r
+'yet\-another\-spider','yet-another-spider',\r
+'yeti','yeti',\r
+'yie8','yie8',\r
+'yodaobot','yodaobot',\r
+'yooglifetchagent','yooglifetchagent',\r
+'youdao','youdao',\r
+'yourls','yourls',\r
+'z\-add_link_checker','z-add_link_checker',\r
+'zealbot','zealbot',\r
+'zemanta','zemanta',\r
+'zend_http_client','zend_http_client',\r
+'zeus','zeus',\r
+'zhuaxia','zhuaxia',\r
+'[^a]fish','[^a]fish',\r
+'[\x20]netseer[\x20]',' netseer ',\r
+'^[1-3]$','^[1-3]$',\r
+'^finbot','^finbot',\r
+'^motorola$','^motorola$',\r
+'^msie','^msie',\r
+'^voyager/','^voyager',\r
+'^webindex$','webindex',\r
+'1\-more_scanner','1-more_scanner',\r
+\r
+# Generic robot\r
+'robot','robot',\r
+'blog','blog',\r
+'checker','checker',\r
+'crawl','crawl',\r
+'discover','discover',\r
+'feed','feed',\r
+'fetcher','fetcher',\r
+'hunter','hunter',\r
+'link','link',\r
+'scanner','scanner',\r
+'seek','seek',\r
+'sitemap','sitemap',\r
+'spider','spider',\r
+'sucker','sucker',\r
+'validator','validator',\r
+'bot[\s_+:,\.\;\/\\\-]','Unknown robot identified by bot\*',\r
+'[\s_+:,\.\;\/\\\-]bot','Unknown robot identified by \*bot',\r
+'curl','Curl',\r
+'php','A PHP script',\r
+'ruby/','Ruby script',\r
+'no_user_agent','empty user agent string',\r
+# Unknown robots identified by hit on robots.txt\r
+'unknown','Unknown robot (identified by hit on robots.txt)'\r
+);\r
+\r
+\r
+# RobotsAffiliateLib\r
+# This list tries to tell which Search Engine a robot is used by\r
+#-------------------------------------------------------------\r
+%RobotsAffiliateLib = (\r
+);\r
+\r
+1;\r
index e56b00801921b929b9cfec24415a9a3626b31623..ad3d3bda380aa126cc4677b413ddfcdc51712215 100644 (file)
-# AWSTATS SEARCH ENGINES DATABASE
-#------------------------------------------------------------------------------
-# If you want to add a Search Engine to extend AWStats database detection capabilities,
-# you must add an entry in SearchEnginesSearchIDOrder, SearchEnginesHashID and in
-# SearchEnginesHashLib.
-# An entry if known in SearchEnginesKnownUrl is also welcome.
-#
-# to eldy: Please check if the following description is correct:
-# You need the following information to specify a search engine:
-# (a) A regular expression that matches the referrer string of the
-#    search engine. Unclear: What about slashes in the name of
-#    a search engine, e.g. as in 'ecosia.com/search'. Seems that
-#    AWStats will non find search strings containing a slash.
-#    Maybe use a search string without a slash, and - if necessary -
-#    an entry in %NotSearchEnginesKeys , if this search string
-#    matches entries that are not search engines.
-#    Example of a web address of a Amazon search engine:
-#    http://www.amazon.de/gp/bit/apps/web/SERP/search/ref=bit_bds-p24_serp_cr_de?ie=UTF8tagbase=bds-p24&query=deutsch+8.+klasse+gymnasium+protokoll
-# (b) A unique string to identify the search engine within AWStats
-# (c) A regular expression that finds the start of the query part in the
-#    referrer string
-# (d) A HTML-fragment that goes into the reports generated by AWStats which
-#    identifies the search engine to human reader of the report. In the
-#    simplest case this is a string containing the name of the search
-#    engine. You can also provide a hypertext clause that presents the
-#    name together with a link to the search engine.
-#
-# The regular expression (a) goes into SearchEnginesSearchIDOrder_list1
-# or ..._list2. List 1 contains common search engines, list 2 those
-# that are not so often used.
-#
-# SearchEnginesHashID contains to consecutive entries for each search
-# engine: The regular expression (a) followed bei the search engine
-# identifier (b)
-#
-# SearchEnginesKnownUrl specifies how to find the start of the query.
-# For each search engine you enter the search engine identifier (b)
-# followed by the regular expression (c). Unclear: It is possible to
-# omit this entry. If you do this, how will AWStats find the start of
-# the query?
-#
-# SearchEnginesHashLib contains also two entries for each search engine:
-# The search engine identifier (b) followed by the HTML-Fragment (d)
-#
-# There are search engines that do not use a query part in their URLs.
-# They put the search expression in the main part of the URL instead.
-# AWStats is able to handle these cases. They are specified as described
-# above, except the following two things:
-# - The regular expression (c) searches the complete URL and not only
-#   the query part.
-# - An additional Entry in the list %SearchEnginesWithKeysNotInQuery is
-#   necessary.
-#
-#
-# AWStats runs a sanity check of the contents of search_engines.pm. This
-# check detects the following things:
-# - Inconsistencies (number of entries)
-# It does not detect the following errors:
-# - If the HTML-Fragment (d) is syntactically incorrect.
-#
-#------------------------------------------------------------------------------
-
-# 2005-08-19 Sean Carlos http://www.antezeta.com/awstats.html
-#            added minor italian search engines
-#                  arianna http://arianna.libero.it/
-#                  supereva http://search.supereva.com/
-#                  kataweb http://kataweb.it/
-#            corrected uk looksmart
-#                  'askuk','ask=', 'bbc','q=', 'freeserve','q=', 'looksmart','key=',
-#            to
-#                  'askuk','ask=', 'bbc','q=', 'freeserve','q=', 'looksmartuk','key=',
-#            corrected spelling
-#                     internationnal -> international
-#            added 'google\.'=>'mail\.google\.', to NotSearchEnginesKeys in order to
-#            avoid counting gmail referrals as search engine traffic
-# 2005-08-21 Sean Carlos http://www.antezeta.com/awstats.html
-#            avoid counting babelfish.altavista referrals as search engine traffic
-#            avoid counting translate.google referrals as search engine traffic
-# 2005-11-20 Sean Carlos
-#           added missing 'tiscali','key=', entry.  Check order
-# 2005-11-22 Sean Carlos
-#           added Google Base & Froogle.  Froogle not tested.
-# 2006-04-18 Sean Carlos http://www.antezeta.com/awstats.html
-#           added biglotron.com (France)
-#           added blingo http://www.blingo.com/
-#           added Clusty & Vivisimo
-#           added eniro.no (Norway) [https://sourceforge.net/forum/message.php?msg_id=3134783]
-#           added GPU p2p search http://search.centraldatabase.org/
-#           added mail.tiscali to "not search engines list" [https://sourceforge.net/forum/message.php?msg_id=3166688]
-#           added Ask group's "mysearch"
-#           added sify.com (India)
-#           added sogou.com (Cina) [https://sourceforge.net/forum/message.php?msg_id=3501603]
-#           Ask changes:
-#           - added Ask Japan (ask.jp)
-#           - break out Ask new country level variants (DE, ES, FR, IT, NL)
-#           - updated Ask name from Ask Jevees
-#           - added Ask q= parameter - many recent searches probably not recognized; [https://sourceforge.net/forum/message.php?msg_id=3465444]
-#           - updated Ask uk (new uk.ask.com added to older ask.co.uk)
-#           updated voila kw|rdata parameter [https://sourceforge.net/forum/message.php?msg_id=3373912]
-#           for each new engine, added link to Search Engine.  This serves to document engine. Done for major & Italian engines as well. Requires patch
-#              to AWStats to allow untranslated html.  Otherwise html will appear instead of link.
-#           reviewed mnoGoSearch (http://www.mnogosearch.org/); the search engined mentioned no longer
-#              exists https://sourceforge.net/forum/message.php?msg_id=3025426
-# 2006-05-13 Sean Carlos http://www.antezeta.com/awstats.html
-#            added 10 Chello European broadband portals (Austria, Belgium, Czech Republic, France, Hungary, The Netherlands, Norway, Poland, Slovakia, Sweden)
-#           added Alice Internal Search (blends data with Google?) search.alice.it.master:10005
-#            added detection of google cache views from IPs 66.249.93.104 72.14.203.104 72.14.207.104
-#              To do: add more extensive IP list; keywords not yet detected.
-#            added icerocket.com blog search http://www.icerocket.com/
-#           added live.com (msn) http://www.live.com/
-#           added Meta motor kartoo.  Note: Kartoo does not provide search words in referrers, thus the engine will appear in the
-#              search engine list but the actual search words are not available.
-#           added netluchs.de http://www.netluchs.de/
-#           added sphere.com blog search http://www.sphere.com/
-#           added wwweasel.de http://wwweasel.de
-#           added Yahoo Mindset! http://mindset.research.yahoo.com/
-#            updated Mirago query parameter recognition (qry=); added breakout for each country (France, Germany, Spain, Italy, Norway, Sweden, Denmark, Netherlands, Belgium, Switzerland)
-# 2006-05-13 Sean Carlos http://www.antezeta.com/awstats.html
-#           added Google cache IPs 64.233.183.104 & 66.102.7.104
-# 2006-05-20 Sean Carlos http://www.antezeta.com/awstats.html
-#              anzwers.com.au
-#              schoenerbrausen.de http://www.schoenerbrausen.de/
-#              added Google cache IP 216.239.59.104
-#              answerbus http://www.answerbus.com/ (does not provide keywords)
-# 2006-05-23 Sean Carlos http://www.antezeta.com/awstats.html
-#              added Google cache IP 66.102.9.104, 64.233.161.104
-# 2006-06-23 Sean Carlos http://www.antezeta.com/awstats.html
-#              added Alice Search search.alice.it
-#              added GoodSearch http://www.goodsearch.com/ (does not provide keywords) "a Yahoo-powered search engine that donates money to your favorite charity or school each time you search the web"
-#              added googlee.com, variant of Google
-#              added gotuneed http://www.gotuneed.com/ Italian search engine, in beta
-#              added icq.com
-#              added logic to parse Google Cache search keywords. Seems to work for alpha but not numeric cache IDs, i.e. search?q=cache:lWVLmnuGJswJ: is recognized but q=cache:Yv5qxeJNuhgJ: is not recognized. The URL triggering the keywords will also appear.  The URLs are probably too varied to parse out?
-#              added Nusearch http://www.nusearch.com/
-#              added Polymeta www.polymeta.hu (does not provide keywords)
-#              added scroogle http://www.scroogle.org/ (does not always provide keywords)
-#              added Tango http://tango.hu/search.php?st=0&q=jeles+napok
-#              Changed Google Cache notation 64\.233\.(161|167|179|183|187)\.104 to 64\.233\.1[0-9]{2}\.104
-#                                            72\.14\.(203|205|207|209|221)\.104 to 72\.14\.2[0-9]{2}\.104
-#                                            216\.239\.(51|59)\.104 to 216\.239\.5[0-9]\.104
-#                                            66\.102\.(7|9)\.104 to 66\.102\.[1-9]\.104
-# 2006-06-27 Sean Carlos http://www.antezeta.com/awstats.html
-#              added Onet.pl http://szukaj.onet.pl/
-#              corrected name "Wirtualna Polska" from "Szukaj" (search); added link http://szukaj.wp.pl/
-# 2006-06-30 Sean Carlos http://www.antezeta.com/awstats.html
-#      Additional Polish Search Engines:
-#      added Dodaj.pl http://www.dodaj.pl/
-#      added Gazeta.pl http://szukaj.gazeta.pl/
-#      added Gery.pl http://szukaj.gery.pl/
-#      added Hoga.pl http://www.hoga.pl/
-#      added Interia.pl http://www.google.interia.pl/
-#      added Katalog.Onet.pl http://katalog.onet.pl/
-#      added NetSprint.pl http://www.netsprint.pl/
-#      added o2.pl http://szukaj2.o2.pl/
-#      added Polska http://szukaj.polska.pl/
-#      added Szukacz http://www.szukacz.pl/
-#      added Wow.pl http://szukaj.wow.pl/
-#      added Sagool http://sagool.jp/
-
-# 2006-08-25 Social Bookmarks
-#      International
-#      added del.icio.us/search - for now, just search referrer. To do: consider /tag/(tagname) referrer?
-#      added stumbleupon.com - No keywords supplied.
-#      added swik.net
-#       added digg. Keywords sometimes supplied.
-#      Italy
-#      added segnalo.alice.it - No keywords supplied.
-#      added ineffabile.it - No keywords supplied.
-
-#       added filter for google groups.  Attempt to parse group name as keyword.
-
-# 2006-09-14
-#      added Eniro Sverige http://www.eniro.se/
-#      added MyWebSearch http://search.mywebsearch.com/
-#      added Teecno http://www.teecno.it/ Italian Open Source Search Engine
-
-#package AWSSE;
-
-# 2006-09-25 (Gabor Moizes)
-# added 4-counter (Google alternative) http://4-counter.com/
-# added Googlecom (Google alternative) http://googlecom.com/
-# added Goggle (Google alternative) http://goggle.co.hu/
-# added Comet toolbar http://as.starware.com
-# added new IP for Yahoo: 216.109.125.130
-# added Ledix http://ledix.net/
-# added AT&T search (powered by Google) http://www.att.net/
-# added Keresolap (Hungarian search engine) http://www.keresolap.hu/
-# added Mozbot (French search engine) http://www.mozbot.fr/
-# added Zoznam (Slovak search engine) http://www.zoznam.sk/
-# added sapo.pt (Portuguese search engine) http://www.sapo.pt/
-# added shaw.ca (powered by Google) http://start.shaw.ca/
-# added Searchalot http://www.searchalot.com/
-# added Copernic http://www.copernic.com/
-# added 216.109.125.130 to Yahoo
-# added 66.218.69.11 to Yahoo
-# added Avantfind http://www.avantfind.com/
-# added Steadysearch http://www.steadysearch.com/
-# added Steadysearch http://www.steady-search.com/
-# modified 216\.239\.5[0-9]\.104/search to 216\.239\.5[0-9]\.104
-
-
-# SearchEnginesSearchIDOrder
-# It contains all matching criteria to search for in log fields. This list is
-# used to know in which order to search Search Engines IDs.
-# Most frequent one are in list1, used when LevelForSearchEnginesDetection is 1 or more
-# Minor robots are in list2, used when LevelForSearchEnginesDetection is 2 or more
-# Note: Regex IDs are in lower case and ' ' and '+' are changed into '_'
-#------------------------------------------------------------------------------
-@SearchEnginesSearchIDOrder_list1=(
-# Major international search engines
-'google\.[\w.]+/products',
-'base\.google\.',
-'froogle\.google\.',
-'groups\.google\.',
-'images\.google\.',
-'google\.',
-'googlee\.',
-'googlecom\.com',
-'goggle\.co\.hu',
-'216\.239\.32\.20',
-'173\.194\.32\.223',
-'216\.239\.(35|37|39|51)\.100',
-'216\.239\.(35|37|39|51)\.101',
-'216\.239\.5[0-9]\.104',
-'64\.233\.1[0-9]{2}\.104',
-'66\.102\.[1-9]\.104',
-'66\.249\.93\.104',
-'72\.14\.2[0-9]{2}\.104',
-'msn\.',
-'live\.com',
-'bing\.',
-'voila\.',
-'mindset\.research\.yahoo',
-'yahoo\.','(66\.218\.71\.225|216\.109\.117\.135|216\.109\.125\.130|66\.218\.69\.11)',
-'search\.aol\.co',
-'tiscali\.',
-'lycos\.',
-'alexa\.com',
-'alltheweb\.com',
-'altavista\.',
-'a9\.com',
-'dmoz\.org',
-'netscape\.',
-'search\.terra\.',
-'www\.search\.com',
-'search\.sli\.sympatico\.ca',
-'excite\.'
-);
-
-@SearchEnginesSearchIDOrder_list2=(
-# Minor international search engines
-'4\-counter\.com',
-'att\.net',
-'bungeebonesdotcom',
-'northernlight\.',
-'hotbot\.',
-'kvasir\.',
-'webcrawler\.',
-'metacrawler\.',
-'go2net\.com',
-'(^|\.)go\.com',
-'euroseek\.',
-'looksmart\.',
-'spray\.',
-'nbci\.com\/search',
-'de\.ask.\com', # break out Ask country specific engines.  (.jp is in Japan section)
-'es\.ask.\com',
-'fr\.ask.\com',
-'it\.ask.\com',
-'nl\.ask.\com',
-'uk\.ask.\com',
-'(^|\.)ask\.com',
-'atomz\.',
-'overture\.com',               # Replace 'goto\.com','Goto.com',
-'teoma\.',
-'findarticles\.com',
-'infospace\.com',
-'mamma\.',
-'dejanews\.',
-'dogpile\.com',
-'wisenut\.com',
-'ixquick\.com',
-'search\.earthlink\.net',
-'i-une\.com',
-'blingo\.com',
-'centraldatabase\.org',
-'clusty\.com',
-'mysearch\.',
-'vivisimo\.com',
-'kartoo\.com',
-'icerocket\.com',
-'sphere\.com',
-'ledix\.net',
-'start\.shaw\.ca',
-'searchalot\.com',
-'copernic\.com',
-'avantfind\.com',
-'steadysearch\.com',
-'steady-search\.com',
-'claro-search\.com',
-'www1\.search-results\.com',
-'www\.holasearch\.com',
-'search\.conduit\.com',
-'static\.flipora\.com',
-'(?:www[12]?|mixidj)\.delta-search\.com',
-'start\.iminent\.com',
-'www\.searchmobileonline\.com',
-'int\.search-results\.com',
-'www2\.inbox\.com',
-'www\.govome\.com',
-'find1friend\.com',
-'start\.mysearchdial\.com',
-'go\.speedbit\.com',
-'search\.certified-toolbar\.com',
-'search\.sweetim\.com',
-'search\.searchcompletion\.com',
-'en\.eazel\.com',
-'sr\.searchfunmoods\.com',
-'173\.194\.35\.177',
-'dalesearch\.com',
-'sweetpacks-search\.com',
-'searchgol\.com',
-'duckduckgo\.com',
-'sr\.facemoods\.com',
-'shoppstop\.com',
-'searchya\.com',
-'picsearch\.de',
-'webssearches\.com',
-'airzip\.inspsearch\.com',
-'zapmeta\.de',
-'localmoxie\.com',
-'search-results\.mobi',
-'androidsearch\.com',
-'isearch\.nation\.com',
-'search\.zonealarm\.com',
-'www\.buenosearch\.com',
-'search\.foxtab\.com',
-'searches\.qone8\.com',
-'startpage\.com',
-'www\.qwant\.com',
-'searches\.safehomepage\.com',
-'searches\.vi-view\.com',
-'wow\.utop\.it',
-'windowssearch\.com',
-'www\.wow\.com',
-'globososo\.',
-'kingtale3\.inspsearch\.com',
-'swisscows\.ch',
-'preciobarato\.xyz',
-'www\.dregol\.com',
-'search\.socialdownloadr\.com',
-'int\.search\.myway\.com',
-'de\.dolphin\.com',
-'mys\.yoursearch\.me',
-# Chello Portals
-'chello\.at',
-'chello\.be',
-'chello\.cz',
-'chello\.fr',
-'chello\.hu',
-'chello\.nl',
-'chello\.no',
-'chello\.pl',
-'chello\.se',
-'chello\.sk',
-'chello', # required as catchall for new countries not yet known
-# Mirago
-'mirago\.be',
-'mirago\.ch',
-'mirago\.de',
-'mirago\.dk',
-'es\.mirago\.com',
-'mirago\.fr',
-'mirago\.it',
-'mirago\.nl',
-'no\.mirago\.com',
-'mirago\.se',
-'mirago\.co\.uk',
-'mirago', # required as catchall for new countries not yet known
-'answerbus\.com',
-'icq\.com\/search',
-'nusearch\.com',
-'goodsearch\.com',
-'scroogle\.org',
-'questionanswering\.com',
-'mywebsearch\.com',
-'as\.starware\.com',
-# Social Bookmarking Services
-'del\.icio\.us',
-'digg\.com',
-'stumbleupon\.com',
-'swik\.net',
-'segnalo\.alice\.it',
-'ineffabile\.it',
-# Minor Australian search engines
-'anzwers\.com\.au',
-# Minor brazilian search engines
-'engine\.exe', 'miner\.bol\.com\.br',
-# Minor chinese search engines
-'\.baidu\.com',     # baidu search portal
-'\.vnet\.cn',       # powered by MSN
-'\.soso\.com',      # powered by Google
-'\.sogou\.com',     # powered by Sohu
-'\.3721\.com',      # powered by Yahoo!
-'iask\.com',        # powered by Sina
-'\.accoona\.com',   # Accoona
-'\.163\.com',       # powered by Google
-'\.zhongsou\.com',  # zhongsou search portal
-# Minor czech search engines
-'atlas\.cz','seznam\.cz','quick\.cz','centrum\.cz','jyxo\.(cz|com)','najdi\.to','redbox\.cz',
-'isearch\.avg\.com',
-# Minor danish search-engines
-'opasia\.dk', 'danielsen\.com', 'sol\.dk', 'jubii\.dk', 'find\.dk', 'edderkoppen\.dk', 'netstjernen\.dk', 'orbis\.dk', 'tyfon\.dk', '1klik\.dk', 'ofir\.dk',
-# Minor dutch search engines
-'ilse\.','vindex\.',
-# Minor english search engines
-'(^|\.)ask\.co\.uk','bbc\.co\.uk/cgi-bin/search','ifind\.freeserve','looksmart\.co\.uk','splut\.','spotjockey\.','ukdirectory\.','ukindex\.co\.uk','ukplus\.','searchy\.co\.uk',
-'search\.fbdownloader\.com',
-'search\.fdownloadr\.com',
-'search\.babylon\.com',
-'my\.allgameshome\.com',
-'surfcanyon\.com',
-'uk\.foxstart\.com',
-'yandex\.com',
-# Minor finnish search engines
-'haku\.www\.fi',
-# Minor french search engines
-'recherche\.aol\.fr','ctrouve\.','francite\.','\.lbb\.org','rechercher\.libertysurf\.fr', 'search[\w\-]+\.free\.fr', 'recherche\.club-internet\.fr',
-'toile\.com', 'biglotron\.com',
-'mozbot\.fr',
-# Minor german search engines
-'sucheaol\.aol\.de',
-'o2suche\.aol\.de',
-'fireball\.de','infoseek\.de','suche\d?\.web\.de','[a-z]serv\.rrzn\.uni-hannover\.de',
-'suchen\.abacho\.de','(brisbane|suche)\.t-online\.de','allesklar\.de','meinestadt\.de',
-'212\.227\.33\.241',
-'(161\.58\.227\.204|161\.58\.247\.101|212\.40\.165\.90|213\.133\.108\.202|217\.160\.108\.151|217\.160\.111\.99|217\.160\.131\.108|217\.160\.142\.227|217\.160\.176\.42)',
-'wwweasel\.de',
-'netluchs\.de',
-'schoenerbrausen\.de',
-'suche\.gmx\.net',
-'suche\.gmx\.at',
-'ecosia\.org',
-'de\.aolsearch\.com',
-'suche\.aol\.de',
-'www\.startxxl\.com',
-'www\.benefind\.de',
-'www\.amazon\.de.*search', #Just as a reminder, probably will not work as AWstats seems to consider the host part of an URL only
-'de\.wow\.com',
-'www\.vlips\.de',
-'metager\.de',
-'search\.1und1\.de',
-'sm\.de',
-'sumaja\.de',
-'navigationshilfe\.t-online\.de',
-'umfis\.de',
-'fastbot\.de',
-'tixuma\.de',
-'suche\.freenet\.de',
-'www\.izito\.de',
-'extern\.peoplecheck\.de',
-'www\.oneseek\.de',
-'de\.wiki\.gov\.cn',
-'umuwa\.de',
-'suche\.1und1\.de',
-'www\.metasuche\.ch',
-# Minor Hungarian search engines
-'heureka\.hu','vizsla\.origo\.hu','lapkereso\.hu','goliat\.hu','index\.hu','wahoo\.hu','webmania\.hu','search\.internetto\.hu',
-'tango\.hu',
-'keresolap\.hu',
-'kereso\.startlap\.hu',
-'polymeta\.hu',
-# Minor Indian search engines
-'sify\.com',
-# Minor Italian search engines
-'virgilio\.it','arianna\.libero\.it','supereva\.com','kataweb\.it','search\.alice\.it\.master','search\.alice\.it','gotuneed\.com',
-'godado','jumpy\.it','shinyseek\.it','teecno\.it',
-# Minor Israeli search engines
-'search\.genieo\.com',
-# Minor Japanese search engines
-'ask\.jp','sagool\.jp',
-'websearch\.rakuten\.co\.jp',
-# Minor Norwegian search engines
-'sok\.start\.no', 'eniro\.no',
-# Minor Polish search engines
-'szukaj\.wp\.pl','szukaj\.onet\.pl','dodaj\.pl','gazeta\.pl','gery\.pl','hoga\.pl','netsprint\.pl','interia\.pl','katalog\.onet\.pl','o2\.pl','polska\.pl','szukacz\.pl','wow\.pl',
-# Minor russian search engines
-'ya(ndex)?\.ru', 'aport\.ru', 'rambler\.ru', 'turtle\.ru', 'metabot\.ru',
-'go\.mail\.ru',
-# Minor Swedish search engines
-'evreka\.passagen\.se','eniro\.se',
-# Minor Slovak search engines
-'zoznam\.sk',
-# Minor Portuguese search engines
-'sapo\.pt',
-# Minor swiss search engines
-'search\.ch', 'search\.bluewin\.ch',
-'www\.zapmeta\.ch',
-'etools\.ch',
-# Minor Croatian, Serbian, Macedonian, Bosnian and Herzegovinian search engines
-'pogodak\.'
-);
-@SearchEnginesSearchIDOrder_listgen=(
-# Generic search engines
-'search\..*\.\w+'
-);
-
-
-# NotSearchEnginesKeys
-# Maps a search engine key (the regex string that identifies the engine) to
-# an exclusion regex. When a search engine key is found, its exclusion regex
-# is checked to decide whether the referrer really is a search engine
-# (e.g. mail.google.* or translate.google.* are not search result pages).
-#
-# A Perl hash keeps only the LAST value given for a repeated key, so all
-# exclusions for one engine must be combined into a single alternation;
-# never list the same key twice.
-#------------------------------------------------------------------------------
-%NotSearchEnginesKeys=(
-'altavista\.'=>'babelfish\.altavista\.',
-# One entry for Google: separate 'google\.' pairs would overwrite each other.
-'google\.'=>'(?:mail|translate|code|groups)\.google\.',
-'msn\.'=>'hotmail\.msn\.',
-'tiscali\.'=>'mail\.tiscali\.',
-'yahoo\.'=>'(?:picks|mail)\.yahoo\.|yahoo\.[^/]+/picks',
-'yandex\.'=>'direct\.yandex\.'
-);
-
-
-# SearchEnginesHashID
-# Maps each search engine search ID (a regex string; the same literals appear as entries of the @SearchEnginesSearchIDOrder_* lists) to the AWStats engine id string that keys SearchEnginesKnownUrl and SearchEnginesHashLib. Several search IDs may share one engine id.
-#------------------------------------------------------------------------------
-%SearchEnginesHashID = (
-# Major international search engines
-'google\.[\w.]+/products','google_products',
-'base\.google\.','google_base',
-'froogle\.google\.','google_froogle',
-'groups\.google\.','google_groups',
-'images\.google\.','google_image',
-'google\.','google',
-'googlee\.','google',
-'googlecom\.com','google',
-'goggle\.co\.hu','google',
-'216\.239\.32\.20', 'google',
-'173\.194\.32\.223', 'google',
-'216\.239\.(35|37|39|51)\.100','google_cache',
-'216\.239\.(35|37|39|51)\.101','google_cache',
-'216\.239\.5[0-9]\.104','google_cache',
-'64\.233\.1[0-9]{2}\.104','google_cache',
-'66\.102\.[1-9]\.104','google_cache',
-'66\.249\.93\.104','google_cache',
-'72\.14\.2[0-9]{2}\.104','google_cache',
-'msn\.','msn',
-'live\.com','live',
-'bing\.','bing',
-'voila\.','voila',
-'mindset\.research\.yahoo','yahoo_mindset',
-'yahoo\.','yahoo','(66\.218\.71\.225|216\.109\.117\.135|216\.109\.125\.130|66\.218\.69\.11)','yahoo',
-'lycos\.','lycos',
-'alexa\.com','alexa',
-'alltheweb\.com','alltheweb',
-'altavista\.','altavista',
-'a9\.com','a9',
-'dmoz\.org','dmoz',
-'netscape\.','netscape',
-'search\.terra\.','terra',
-'www\.search\.com','search.com',
-'tiscali\.','tiscali',
-'search\.aol\.co','aol',
-'search\.sli\.sympatico\.ca','sympatico',
-'excite\.','excite',
-# Minor international search engines
-'4\-counter\.com','google4counter',
-'att\.net','att',
-'bungeebonesdotcom','bungeebonesdotcom',
-'northernlight\.','northernlight',
-'hotbot\.','hotbot',
-'kvasir\.','kvasir',
-'webcrawler\.','webcrawler',
-'metacrawler\.','metacrawler',
-'go2net\.com','go2net',
-'(^|\.)go\.com','go',
-'euroseek\.','euroseek',
-'looksmart\.','looksmart',
-'spray\.','spray',
-'nbci\.com\/search','nbci',
-'de\.ask.\com','askde', # break out Ask country specific engines. NOTE(review): '.\com' in these six keys looks like a typo for '\.com' ('\co' is a control-character escape in a Perl regex); presumably the same strings appear in the search ID order list, so both would have to be fixed together - TODO confirm
-'es\.ask.\com','askes',
-'fr\.ask.\com','askfr',
-'it\.ask.\com','askit',
-'nl\.ask.\com','asknl',
-'uk\.ask.\com','askuk',
-'(^|\.)ask\.co\.uk','askuk',
-'(^|\.)ask\.com','ask',
-'atomz\.','atomz',
-'overture\.com','overture',            # Replace 'goto\.com','Goto.com',
-'teoma\.','teoma',
-'findarticles\.com','findarticles',
-'infospace\.com','infospace',
-'mamma\.','mamma',
-'dejanews\.','dejanews',
-'dogpile\.com','dogpile',
-'wisenut\.com','wisenut',
-'ixquick\.com','ixquick',
-'search\.earthlink\.net','earthlink',
-'i-une\.com','iune',
-'blingo\.com','blingo',
-'centraldatabase\.org','centraldatabase',
-'clusty\.com','clusty',
-'mysearch\.','mysearch',
-'vivisimo\.com','vivisimo',
-'kartoo\.com','kartoo',
-'icerocket\.com','icerocket',
-'sphere\.com','sphere',
-'ledix\.net','ledix',
-'start\.shaw\.ca','shawca',
-'searchalot\.com','searchalot',
-'copernic\.com','copernic',
-'avantfind\.com','avantfind',
-'steadysearch\.com','steadysearch',
-'steady-search\.com','steadysearch',
-'claro-search\.com','clarosearch',
-'www1\.search-results\.com', 'searchresults',
-'www\.holasearch\.com', 'holasearch',
-'search\.conduit\.com', 'conduit',
-'static\.flipora\.com', 'flipora',
-'(?:www[12]?|mixidj)\.delta-search\.com', 'delta-search',
-'start\.iminent\.com', 'iminent',
-'www\.searchmobileonline\.com', 'searchmobileonline',
-'int\.search-results\.com', 'nortonsavesearch',
-'www2\.inbox\.com', 'inbox',
-'www\.govome\.com', 'govome',
-'find1friend\.com', 'find1friend',
-'start\.mysearchdial\.com', 'mysearchdial',
-'go\.speedbit\.com', 'speedbit',
-'search\.certified-toolbar\.com', 'certifiedtoolbarsearch',
-'search\.sweetim\.com', 'sweetim',
-'search\.searchcompletion\.com', 'searchcompletion',
-'en\.eazel\.com','eazelsearch',
-'sr\.searchfunmoods\.com', 'searchfunmoods',
-'173\.194\.35\.177', 'googleByIP',
-'dalesearch\.com', 'dalesearch',
-'sweetpacks-search\.com', 'sweetpacks',
-'searchgol\.com', 'searchgol',
-'duckduckgo\.com', 'duckduckgo',
-'sr\.facemoods\.com', 'facemoods',
-'shoppstop\.com', 'shoppstop',
-'searchya\.com', 'searchya',
-'picsearch\.de', 'picsearch',
-'webssearches\.com', 'webssearches',
-'airzip\.inspsearch\.com', 'webssearches',
-'zapmeta\.de', 'zapmeta',
-'localmoxie\.com', 'localmoxie',
-'search-results\.mobi', 'search-results_mobi',
-'androidsearch\.com', 'androidsearch',
-'isearch\.nation\.com', 'isearch_nation_com',
-'search\.zonealarm\.com', 'search_zonealarm_com',
-'www\.buenosearch\.com', 'www_buenosearch_com',
-'search\.foxtab\.com', 'search_foxtab_com',
-'searches\.qone8\.com', 'searches_qone8_com',
-'startpage\.com', 'startpage_com',
-'www\.qwant\.com', 'qwant_com',
-'searches\.safehomepage\.com', 'safehomepage_com',
-'searches\.vi-view\.com', 'vi-view_com',
-'wow\.utop\.it', 'wow_utop_it',
-'windowssearch\.com', 'windowssearch_com',
-'www\.wow\.com', 'www_wow_com',
-'globososo\.', 'globososo',
-'kingtale3\.inspsearch\.com', 'globososo',
-'swisscows\.ch', 'swisscows_ch',
-'preciobarato\.xyz', 'preciobarato_xyz',
-'www\.dregol\.com', 'www_dregol_com',
-'search\.socialdownloadr\.com', 'search_socialdownloadr_com',
-'int\.search\.myway\.com', 'int_search_myway_com',
-'de\.dolphin\.com', 'de_dolphin_com',
-'mys\.yoursearch\.me', 'mys_yoursearch_me',
-# Chello Portals
-'chello\.at','chelloat',
-'chello\.be','chellobe',
-'chello\.cz','chellocz',
-'chello\.fr','chellofr',
-'chello\.hu','chellohu',
-'chello\.nl','chellonl',
-'chello\.no','chellono',
-'chello\.pl','chellopl',
-'chello\.se','chellose',
-'chello\.sk','chellosk',
-'chello','chellocom',
-# Mirago
-'mirago\.be','miragobe',
-'mirago\.ch','miragoch',
-'mirago\.de','miragode',
-'mirago\.dk','miragodk',
-'es\.mirago\.com','miragoes',
-'mirago\.fr','miragofr',
-'mirago\.it','miragoit',
-'mirago\.nl','miragonl',
-'no\.mirago\.com','miragono',
-'mirago\.se','miragose',
-'mirago\.co\.uk','miragocouk',
-'mirago','mirago', # required as catchall for new countries not yet known
-'answerbus\.com','answerbus',
-'icq\.com\/search','icq',
-'nusearch\.com','nusearch',
-'goodsearch\.com','goodsearch',
-'scroogle\.org','scroogle',
-'questionanswering\.com','questionanswering',
-'mywebsearch\.com','mywebsearch',
-'as\.starware\.com','comettoolbar',
-# Social Bookmarking Services
-'del\.icio\.us','delicious',
-'digg\.com','digg',
-'stumbleupon\.com','stumbleupon',
-'swik\.net','swik',
-'segnalo\.alice\.it','segnalo',
-'ineffabile\.it','ineffabile',
-# Minor Australian search engines
-'anzwers\.com\.au','anzwers',
-# Minor brazilian search engines
-'engine\.exe','engine',
-'miner\.bol\.com\.br','miner',
-# Minor chinese search engines
-'\.baidu\.com','baidu',
-'iask\.com','iask',
-'\.accoona\.com','accoona',
-'\.3721\.com','3721',
-'\.163\.com','netease',
-'\.soso\.com','soso',
-'\.zhongsou\.com','zhongsou',
-'\.vnet\.cn','vnet',
-'\.sogou\.com','sogou',
-# Minor czech search engines
-'atlas\.cz','atlas',
-'seznam\.cz','seznam',
-'quick\.cz','quick',
-'centrum\.cz','centrum',
-'jyxo\.(cz|com)','jyxo',
-'najdi\.to','najdi',
-'redbox\.cz','redbox',
-'isearch\.avg\.com', 'avgsearch',
-# Minor danish search-engines
-'opasia\.dk','opasia',
-'danielsen\.com','danielsen',
-'sol\.dk','sol',
-'jubii\.dk','jubii',
-'find\.dk','finddk',
-'edderkoppen\.dk','edderkoppen',
-'netstjernen\.dk','netstjernen',
-'orbis\.dk','orbis',
-'tyfon\.dk','tyfon',
-'1klik\.dk','1klik',
-'ofir\.dk','ofir',
-# Minor dutch search engines
-'ilse\.','ilse',
-'vindex\.','vindex',
-# Minor english search engines
-'bbc\.co\.uk/cgi-bin/search','bbc',
-'ifind\.freeserve','freeserve',
-'looksmart\.co\.uk','looksmartuk',
-'splut\.','splut',
-'spotjockey\.','spotjockey',
-'ukdirectory\.','ukdirectory',
-'ukindex\.co\.uk','ukindex',
-'ukplus\.','ukplus',
-'searchy\.co\.uk','searchy',
-'search\.fbdownloader\.com','fbdownloader',
-'search\.fdownloadr\.com', 'fdownloadr_com',
-'search\.babylon\.com', 'babylon',
-'my\.allgameshome\.com', 'allgameshome',
-'surfcanyon\.com', 'surfcanyon_com',
-'uk\.foxstart\.com', 'uk_foxstart_com',
-'yandex\.com', 'yandex_com',
-# Minor finnish search engines
-'haku\.www\.fi','haku',
-# Minor french search engines
-'recherche\.aol\.fr','aolfr',
-'ctrouve\.','ctrouve',
-'francite\.','francite',
-'\.lbb\.org','lbb',
-'rechercher\.libertysurf\.fr','libertysurf',
-'search[\w\-]+\.free\.fr','free',
-'recherche\.club-internet\.fr','clubinternet',
-'toile\.com','toile',
-'biglotron\.com', 'biglotron',
-'mozbot\.fr', 'mozbot',
-# Minor german search engines
-'sucheaol\.aol\.de','aolde',
-'o2suche\.aol\.de','o2aolde',
-'fireball\.de','fireball',
-'infoseek\.de','infoseek',
-'suche\d?\.web\.de','webde',
-'[a-z]serv\.rrzn\.uni-hannover\.de','meta',
-'suchen\.abacho\.de','abacho',
-'(brisbane|suche)\.t-online\.de','t-online',
-'allesklar\.de','allesklar',
-'meinestadt\.de','meinestadt',
-'212\.227\.33\.241','metaspinner',
-'(161\.58\.227\.204|161\.58\.247\.101|212\.40\.165\.90|213\.133\.108\.202|217\.160\.108\.151|217\.160\.111\.99|217\.160\.131\.108|217\.160\.142\.227|217\.160\.176\.42)','metacrawler_de',
-'wwweasel\.de','wwweasel',
-'netluchs\.de','netluchs',
-'schoenerbrausen\.de','schoenerbrausen',
-'suche\.gmx\.net', 'gmxsuche',
-'suche\.gmx\.at', 'gmxsuche_at',
-'ecosia\.org', 'ecosiasearch',
-'de\.aolsearch\.com', 'aolsearch',
-'suche\.aol\.de', 'aolsuche',
-'www\.startxxl\.com', 'startxxl',
-'www\.benefind\.de', 'benefind',
-'www\.amazon\.de.*search', 'amazonsearch', #Not clear if this matches amazon searches only
-'de\.wow\.com', 'wowsearch',
-'www\.vlips\.de', 'vlips_de',
-'metager\.de', 'metager',
-'search\.1und1\.de', 'search_1und1_de',
-'sm\.de', 'smde',
-'sumaja\.de', 'sumaja',
-'navigationshilfe\.t-online\.de', 'navigationshilfe',
-'umfis\.de', 'umfis',
-'fastbot\.de', 'fastbot_de',
-'tixuma\.de', 'tixuma_de',
-'suche\.freenet\.de', 'freenet_de',
-'www\.izito\.de', 'izito_de',
-'extern\.peoplecheck\.de', 'peoplecheck_de',
-'www\.oneseek\.de', 'oneseek_de',
-'de\.wiki\.gov\.cn', 'de_wiki_gov_cn',
-'umuwa\.de', 'umuwa_de',
-'suche\.1und1\.de', '1und1_de',
-'www\.metasuche\.ch', 'metasuche_ch',
-# Minor Hungarian search engines
-'heureka\.hu','heureka',
-'vizsla\.origo\.hu','origo',
-'lapkereso\.hu','lapkereso',
-'goliat\.hu','goliat',
-'index\.hu','indexhu',
-'wahoo\.hu','wahoo',
-'webmania\.hu','webmania',
-'search\.internetto\.hu','internetto',
-'tango\.hu','tango_hu',
-'keresolap\.hu','keresolap_hu',
-'kereso\.startlap\.hu', 'startlap_hu',
-'polymeta\.hu','polymeta_hu',
-# Minor Indian search engines
-'sify\.com','sify',
-# Minor Italian search engines
-'virgilio\.it','virgilio',
-'arianna\.libero\.it','arianna',
-'supereva\.com','supereva',
-'kataweb\.it','kataweb',
-'search\.alice\.it\.master','aliceitmaster',
-'search\.alice\.it','aliceit',
-'gotuneed\.com','gotuneed',
-'godado','godado',
-'jumpy\.it','jumpy\.it', # the engine id itself contains the backslash; SearchEnginesKnownUrl is keyed by the same 'jumpy\.it' string
-'shinyseek\.it','shinyseek\.it', # same as above: id is the literal 'shinyseek\.it'
-'teecno\.it','teecnoit',
-# Minor Israeli search engines
-'search\.genieo\.com', 'genieo',
-# Minor Japanese search engines
-'ask\.jp','askjp',
-'sagool\.jp','sagool',
-'websearch\.rakuten\.co\.jp', 'rakuten',
-# Minor Norwegian search engines
-'sok\.start\.no','start', 'eniro\.no','eniro',
-# Minor Polish search engines
-'szukaj\.wp\.pl','wp',
-'szukaj\.onet\.pl','onetpl',
-'dodaj\.pl','dodajpl',
-'gazeta\.pl','gazetapl',
-'gery\.pl','gerypl',
-'netsprint\.pl\/hoga\-search','hogapl',
-'netsprint\.pl','netsprintpl',
-'interia\.pl','interiapl',
-'katalog\.onet\.pl','katalogonetpl',
-'o2\.pl','o2pl',
-'polska\.pl','polskapl',
-'szukacz\.pl','szukaczpl',
-'wow\.pl','wowpl',
-# Minor russian search engines
-'ya(ndex)?\.ru','yandex',
-'aport\.ru','aport',
-'rambler\.ru','rambler',
-'turtle\.ru','turtle',
-'metabot\.ru','metabot',
-'go\.mail\.ru', 'mailru',
-# Minor Swedish search engines
-'evreka\.passagen\.se','passagen',
-'eniro\.se','enirose',
-# Minor Slovak search engines
-'zoznam\.sk','zoznam',
-# Minor Portuguese search engines
-'sapo\.pt','sapo',
-# Minor swiss search engines
-'search\.ch','searchch',
-'search\.bluewin\.ch','bluewin',
-'www\.zapmeta\.ch', 'zapmeta_ch',
-'etools\.ch', 'etools_ch',
-# Minor Croatian, Serbian, Macedonian, Bosnian and Herzegovinian search engines
-'pogodak\.','pogodak',
-# Generic search engines (same pattern as the single entry of @SearchEnginesSearchIDOrder_listgen)
-'search\..*\.\w+','search'
-);
-
-
-# SearchEnginesWithKeysNotInQuery
-# Engine ids whose referrer URL holds the keywords as part of the page
-# address instead of in a query parameter. Each listed id maps to 1; the
-# trailing comment shows an example referrer.
-#------------------------------------------------------------------------------
-%SearchEnginesWithKeysNotInQuery = (
-    'a9'             => 1,    # www.a9.com/searchkey1%20searchkey2
-    'iminent'        => 1,    # http://start.iminent.com/StartWeb/1031/toolbox/#q=searchkey1%20searchkey2&additional_arguments
-    'de_wiki_gov_cn' => 1,    # http://de.wiki.gov.cn/s_searchkey1%20searchkey2
-    'umuwa_de'       => 1,    # http://umuwa.de/searchkey or http://umuwa.de/searchkey/Images
-    'amazonsearch'   => 1,    # http://www.amazon.de/gp/bit/apps/web/SERP/search/ref=bit_bds-p24_serp_cr_de?ie=UTF8tagbase=bds-p24&query=deutsch+8.+klasse+gymnasium+protokoll
-);
-
-# SearchEnginesKnownUrl
-# Maps an AWStats engine id (a value of SearchEnginesHashID) to the known rule, a regex fragment, for extracting keywords from that engine's referrer URL; most rules are a query parameter name plus '=', a few match a URL path prefix, and '' is used where no usable rule is known.
-#------------------------------------------------------------------------------
-%SearchEnginesKnownUrl=(
-# Most common search engines
-'alexa','q=',
-'alltheweb','q(|uery)=',
-'altavista','q=',
-'a9','a9\.com\/',
-'dmoz','search=',
-'google_products','(p|q|as_p|as_q)=',
-'google_base','(p|q|as_p|as_q)=',
-'google_froogle','(p|q|as_p|as_q)=',
-'google_groups','group\/', # does not work
-'google_image','(p|q|as_p|as_q)=',
-'google_cache','(p|q|as_p|as_q)=cache:[0-9A-Za-z]{12}:',
-'google','(p|q|as_p|as_q)=',
-'lycos','query=',
-'msn','q=',
-'live','q=',
-'bing','q=',
-'netscape','search=',
-'tiscali','key=',
-'aol','query=',
-'terra','query=',
-'voila','(kw|rdata)=',
-'search.com','q=',
-'yahoo_mindset','p=',
-'yahoo','p=',
-'sympatico', 'query=',
-'excite','search=',
-# Minor international search engines
-'google4counter','(p|q|as_p|as_q)=',
-'att','qry=',
-'bungeebonesdotcom','query=',
-'go','qt=',
-'askde','(ask|q)=', # break out Ask country specific engines.
-'askes','(ask|q)=',
-'askfr','(ask|q)=',
-'askit','(ask|q)=',
-'asknl','(ask|q)=',
-'ask','(ask|q)=',
-'atomz','sp-q=',
-'euroseek','query=',
-'findarticles','key=',
-'go2net','general=',
-'hotbot','mt=',
-'infospace','qkw=',
-'kvasir', 'q=',
-'looksmart','key=',
-'mamma','query=',
-'metacrawler','general=',
-'nbci','keyword=',
-'northernlight','qr=',
-'overture','keywords=',
-'dogpile', 'q(|kw)=',
-'spray','string=',
-'teoma','q=',
-'webcrawler','searchText=',
-'wisenut','query=',
-'ixquick', 'query=',
-'earthlink', 'q=',
-'iune','(keywords|q)=',
-'blingo','q=',
-'centraldatabase','query=',
-'clusty','query=',
-'mysearch','searchfor=',
-'vivisimo','query=',
-# kartoo: No keywords passed in referring URL.
-'kartoo','',
-'icerocket','q=',
-'sphere','q=',
-'ledix','q=',
-'shawca','q=',
-'searchalot','q=',
-'copernic','web\/',
-'avantfind','keywords=',
-'steadysearch','w=',
-'clarosearch','q=',
-'searchresults','q=',
-'holasearch', 'q=',
-'conduit', 'q=',
-'flipora', 'q=',
-'delta-search', 'q=',
-'iminent', 'q=',
-'searchmobileonline', 'q=',
-'nortonsavesearch', 'q=',
-'inbox', 'q(?:kw)?=',
-'govome', 'q=',
-'find1friend', 'q=',
-'mysearchdial', 'q=',
-'speedbit', 'q=',
-'certifiedtoolbarsearch', 'q=',
-'sweetim', 'q=',
-'searchcompletion', 'q=',
-'eazelsearch', 'q=',
-'searchfunmoods', 'q=',
-'googleByIP', 'q=',
-'dalesearch',  'q=',
-'sweetpacks', 'q=',
-'searchgol', 'q=',
-'duckduckgo', 'uddg=',
-'facemoods', 'q=',
-'shoppstop', 'keywords=',
-'searchya', 'q=',
-'picsearch', 'q=',
-'webssearches', 'q=',
-'zapmeta', 'query=',
-'localmoxie', 'keyword=',
-'search-results_mobi', 'q=',
-'androidsearch', 'q=',
-'isearch_nation_com', 'q=',
-'search_zonealarm_com', 'q=',
-'www_buenosearch_com', 'q=',
-'search_foxtab_com', 'q=',
-'searches_qone8_com', 'q=',
-'startpage_com', 'query=',
-'qwant_com', 'q=',
-'safehomepage_com', 'q=',
-'vi-view_com', 'q=',
-'wow_utop_it', 'q=',
-'windowssearch_com', 'q=',
-'www_wow_com', 'q=',
-'globososo', 'q=',
-'swisscows_ch', 'query=',
-'preciobarato_xyz', 's=',
-'www_dregol_com', 'q=',
-'search_socialdownloadr_com', 'q=',
-'int_search_myway_com', 'searchfor=',
-'de_dolphin_com', 'q=',
-'mys_yoursearch_me', 'q=',
-# Chello Portals
-'chelloat','q1=',
-'chellobe','q1=',
-'chellocz','q1=',
-'chellofr','q1=',
-'chellohu','q1=',
-'chellonl','q1=',
-'chellono','q1=',
-'chellopl','q1=',
-'chellose','q1=',
-'chellosk','q1=',
-'chellocom','q1=',
-# Mirago
-'miragobe','(txtsearch|qry)=',
-'miragoch','(txtsearch|qry)=',
-'miragode','(txtsearch|qry)=',
-'miragodk','(txtsearch|qry)=',
-'miragoes','(txtsearch|qry)=',
-'miragofr','(txtsearch|qry)=',
-'miragoit','(txtsearch|qry)=',
-'miragonl','(txtsearch|qry)=',
-'miragono','(txtsearch|qry)=',
-'miragose','(txtsearch|qry)=',
-'miragocouk','(txtsearch|qry)=',
-'mirago','(txtsearch|qry)=',
-'answerbus','', # Does not provide query parameters
-'icq','q=',
-'nusearch','nusearch_terms=',
-'goodsearch','Keywords=',
-'scroogle','Gw=', # Does not always provide query parameters
-'questionanswering','', # empty rule; reason not documented here
-'mywebsearch','searchfor=',
-'comettoolbar','qry=',
-# Social Bookmarking Services
-'delicious','all=',
-'digg','s=',
-'stumbleupon','',
-'swik','swik\.net/', # does not work. Keywords follow domain, e.g. http://swik.net/awstats+analytics
-'segnalo','',
-'ineffabile','',
-# Minor Australian search engines
-'anzwers','search=',
-# Minor brazilian search engines
-'engine','p1=', 'miner','q=',
-# Minor chinese search engines
-'baidu','(wd|word)=',
-'iask','(w|k)=',
-'accoona','qt=',
-'3721','(p|name)=',
-'netease','q=',
-'soso','q=',
-'zhongsou','(word|w)=',
-'sogou', 'query=',
-'vnet','kw=',
-# Minor czech search engines
-'atlas','(searchtext|q)=', 'seznam','(w|q)=', 'quick','query=', 'centrum','q=', 'jyxo','(s|q)=', 'najdi','dotaz=', 'redbox','srch=',
-'avgsearch', 'q=',
-# Minor danish search engines
-'opasia','q=', 'danielsen','q=', 'sol','q=', 'jubii','soegeord=', 'finddk','words=', 'edderkoppen','query=', 'orbis','search_field=', '1klik','query=', 'ofir','querytext=',
-# Minor dutch search engines
-'ilse','search_for=', 'vindex','in=',
-# Minor english search engines
-'askuk','(ask|q)=', 'bbc','q=', 'freeserve','q=', 'looksmartuk','key=',
-'splut','pattern=', 'spotjockey','Search_Keyword=', 'ukindex', 'stext=', 'ukdirectory','k=', 'ukplus','search=', 'searchy', 'search_term=',
-'fbdownloader','q=',
-'fdownloadr_com', 'q=',
-'babylon','q=',
-'allgameshome', 's=',
-'surfcanyon_com', 'q=',
-'uk_foxstart_com', 'q=',
-'yandex_com', 'text=',
-# Minor finnish search engines
-'haku','w=',
-# Minor french search engines
-'francite','name=', 'clubinternet', 'q=',
-'toile', 'q=',
-'biglotron','question=',
-'mozbot','q=',
-# Minor german search engines
-'aolde','q=',
-'o2aolde', 'q=',
-'fireball','q=', 'infoseek','qt=', 'webde','su=',
-'abacho','q=', 't-online','q=',
-'metaspinner','qry=',
-'metacrawler_de','qry=',
-'wwweasel','q=',
-'netluchs','query=',
-'schoenerbrausen','q=',
-'gmxsuche', 'q=',
-'gmxsuche_at', 'q=',
-'ecosiasearch', 'q=',
-'aolsearch', 'q=',
-'aolsuche', 'q=',
-'startxxl', 'q=',
-'benefind', 'q=',
-'amazonsearch', 'query=',
-'wowsearch', 'q=',
-'vlips_de', 'q=',
-'metager', 'eingabe=',
-'search_1und1_de', 'q=',
-'smde', 'q=',
-#'sumaja', 'no query string available', #There is no query string in the referrer url
-'navigationshilfe', 'q=',
-'umfis', 'suchbegriff=',
-'fastbot_de', 'red=[0-9]*\+',
-'tixuma_de', 'sc=',
-'freenet_de', 'query=',
-'izito_de', 'q=',
-'peoplecheck_de', 'q=',
-'oneseek_de', 'q=',
-'de_wiki_gov_cn', 'de\.wiki\.gov\.cn\/s_',
-'umuwa_de', 'umuwa\.de\/',
-'1und1_de', 'q=',
-'metasuche_ch', 'q=',
-# Minor Hungarian search engines
-'heureka','heureka=', 'origo','(q|search)=', 'goliat','KERESES=', 'wahoo','q=', 'internetto','searchstr=',
-'keresolap_hu','q=',
-'startlap_hu', 'q=',
-'tango_hu','q=',
-'polymeta_hu','', # empty rule; reason not documented here
-# Minor Indian search engines
-'sify','keyword=',
-# Minor Italian search engines
-'virgilio','qs=',
-'arianna','query=',
-'supereva','q=',
-'kataweb','q=',
-'aliceitmaster','qs=',
-'aliceit','qs=',
-'gotuneed','', # Not yet known
-'godado','Keywords=',
-'jumpy\.it','searchWord=', # key carries a backslash because SearchEnginesHashID uses 'jumpy\.it' as the engine id
-'shinyseek\.it','KEY=', # same: engine id is the literal 'shinyseek\.it'
-'teecnoit','q=',
-# Minor Israeli search engines
-'genieo','q=',
-# Minor Japanese search engines
-'askjp','(ask|q)=',
-'sagool','q=',
-'rakuten', 'qt=',
-# Minor Norwegian search engines
-'start','q=', 'eniro','q=',
-# Minor Polish search engines
-'wp','szukaj=',
-'onetpl','qt=',
-'dodajpl','keyword=',
-'gazetapl','slowo=',
-'gerypl','q=',
-'hogapl','qt=',
-'netsprintpl','q=',
-'interiapl','q=',
-'katalogonetpl','qt=',
-'o2pl','qt=',
-'polskapl','qt=',
-'szukaczpl','q=',
-'wowpl','q=',
-# Minor russian search engines
-'yandex', 'text=', 'rambler','words=', 'aport', 'r=', 'metabot', 'st=',
-'mailru', 'q=',
-# Minor swedish search engines
-'passagen','q=',
-'enirose', 'hitta:', #Not sure if this works, as the keywords are part of the URL, and therefore the URL does not contain a question mark.
-# Minor swiss search engines
-'searchch', 'q=', 'bluewin', 'qry=',
-'zapmeta_ch', 'query=',
-'etools_ch', 'query=',
-# Minor Croatian, Serbian, Macedonian, Bosnian and Herzegovinian search engines
-'pogodak', 'q='
-);
-
-# SearchEnginesKnownUrlNotFound
-# Per-engine rules (keyed by engine id) for extracting "not found" keywords
-# from a search engine referrer URL. MSN is the only engine with such a rule.
-#------------------------------------------------------------------------------
-%SearchEnginesKnownUrlNotFound = ( 'msn' => 'origq=' );
-
-# Fallback when no extraction rule is known for an engine: the first URL
-# parameter that is NOT listed in WordsToCleanSearchUrl is taken.
-# Element order is unchanged from the original single-line list.
-#------------------------------------------------------------------------------
-@WordsToCleanSearchUrl = (
-    'act=', 'annuaire=',
-    'btng=',
-    'cat=', 'categoria=', 'cfg=', 'cof=', 'cou=', 'count=', 'cp=',
-    'dd=', 'domain=', 'dt=', 'dw=',
-    'enc=', 'exec=',
-    'geo=',
-    'hc=', 'height=', 'hits=', 'hl=', 'hq=', 'hs=',
-    'id=',
-    'kl=',
-    'lang=', 'loc=', 'lr=',
-    'matchmode=', 'medor=', 'message=', 'meta=', 'mode=',
-    'order=',
-    'page=', 'par=', 'pays=', 'pg=', 'pos=', 'prg=',
-    'qc=',
-    'refer=',
-    'sa=', 'safe=', 'sc=', 'sort=', 'src=', 'start=', 'style=', 'stype=', 'sum=',
-    'tag=', 'temp=', 'theme=', 'type=',
-    'url=', 'user=',
-    'width=', 'what=',
-    '\\.x=', '\\.y=', 'y=',
-    'look=',
-);
-
-# SearchEnginesKnownUTFCoding
-# For each engine id, the URL parameter whose presence proves that the
-# search engine encoded its parameters in UTF-8.
-#------------------------------------------------------------------------------
-%SearchEnginesKnownUTFCoding = (
-    'google'    => 'ie=utf-8',
-    'alltheweb' => 'cs=utf-8',
-);
-
-
-# SearchEnginesHashLib
-# List of search engines names
-# 'search_engine_id', 'search_engine_name',
-#------------------------------------------------------------------------------
-%SearchEnginesHashLib=(
-# Major international search engines
-'alexa','<a href="http://www.alexa.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Alexa</a>',
-'alltheweb','<a href="http://www.alltheweb.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">AllTheWeb</a>',
-'altavista','<a href="http://www.altavista.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">AltaVista</a>',
-'a9', '<a href="http://www.a9.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">A9</a>',
-'dmoz','<a href="http://dmoz.org/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">DMOZ</a>',
-'google_products','<a href="http://www.google.com/products" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google (Products)</a>',
-'google_base','<a href="http://base.google.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google (Base)</a>',
-'google_froogle','<a href="http://froogle.google.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Froogle (Google)</a>',
-'google_groups','<a href="http://groups.google.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google (Groups)</a>',
-'google_image','<a href="http://images.google.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google (Images)</a>',
-'google_cache','<a href="http://www.google.com/help/features.html#cached" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google (cache)</a>',
-'google','<a href="http://www.google.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Google</a>',
-'lycos','<a href="http://www.lycos.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Lycos</a>',
-'msn','<a href="http://search.msn.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Microsoft MSN Search</a>',
-'live','<a href="http://www.live.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Microsoft Windows Live</a>',
-'bing','<a href="http://www.bing.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Microsoft Bing</a>',
-'netscape','<a href="http://www.netscape.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Netscape</a>',
-'aol','<a href="http://www.aol.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">AOL</a>',
-'terra','<a href="http://www.terra.es/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Terra</a>',
-'tiscali','<a href="http://search.tiscali.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Tiscali</a>',
-'voila','<a href="http://www.voila.fr/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Voila</a>',
-'search.com','<a href="http://www.search.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Search.com</a>',
-'yahoo_mindset','<a href="http://mindset.research.yahoo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Yahoo! Mindset</a>',
-'yahoo','<a href="http://www.yahoo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Yahoo!</a>',
-'sympatico','<a href="http://sympatico.msn.ca/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Sympatico</a>',
-'excite','<a href="http://www.excite.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Excite</a>',
-# Minor international search engines
-'google4counter','<a href="http://www.4-counter.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">4-counter (Google)</a>',
-'att','<a href="http://www.att.net/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">AT&T search (powered by Google)</a>',
-'bungeebonesdotcom','<a href="http://BungeeBones.com/search.php/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">BungeeBones</a>',
-'go','Go.com',
-'askde','<a href="http://de.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask Deutschland</a>',
-'askes','<a href="http://es.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask Espa&ntilde;a</a>', # break out Ask country specific engines.
-'askfr','<a href="http://fr.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask France</a>',
-'askit','<a href="http://it.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask Italia</a>',
-'asknl','<a href="http://nl.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask Nederland</a>',
-'ask','<a href="http://www.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask</a>',
-'atomz','Atomz',
-'dejanews','DejaNews',
-'euroseek','Euroseek',
-'findarticles','Find Articles',
-'go2net','Go2Net (Metamoteur)',
-'hotbot','Hotbot',
-'infospace','InfoSpace',
-'kvasir','Kvasir',
-'looksmart','Looksmart',
-'mamma','Mamma',
-'metacrawler','MetaCrawler (Metamoteur)',
-'nbci','NBCI',
-'northernlight','NorthernLight',
-'overture','Overture',                 # Replace 'goto\.com','Goto.com',
-'dogpile','<a href="http://www.dogpile.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Dogpile</a>',
-'spray','Spray',
-'teoma','<a href="http://search.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Teoma</a>',                                                      # Replace 'directhit\.com','DirectHit',
-'webcrawler','<a href="http://www.webcrawler.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">WebCrawler</a>',
-'wisenut','WISENut',
-'ixquick','<a href="http://www.ixquick.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">ix quick</a>',
-'earthlink', 'Earth Link',
-'iune','<a href="http://www.i-une.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">i-une</a>',
-'blingo','<a href="http://www.blingo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Blingo</a>',
-'centraldatabase','<a href="http://search.centraldatabase.org/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">GPU p2p search</a>',
-'clusty','<a href="http://www.clusty.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Clusty</a>',
-'mysearch','<a href="http://www.mysearch.com" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">My Search</a>',
-'vivisimo','<a href="http://www.vivisimo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Vivisimo</a>',
-'kartoo','<a href="http://www.kartoo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Kartoo</a>',
-'icerocket','<a href="http://www.icerocket.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Icerocket (Blog)</a>',
-'sphere','<a href="http://www.sphere.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Sphere (Blog)</a>',
-'ledix','<a href="http://www.ledix.net/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ledix</a>',
-'shawca','<a href="http://start.shaw.ca/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Shaw.ca</a>',
-'searchalot','<a href="http://www.searchalot.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Searchalot</a>',
-'copernic','<a href="http://www.copernic.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Copernic</a>',
-'avantfind','<a href="http://www.avantfind.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Avantfind</a>',
-'steadysearch','<a href="http://www.avantfind.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Avantfind</a>',
-'clarosearch','<a href="http://www.claro-search.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Claro Search</a>',
-'searchresults','<a href="http://www1.search-results.com/" rel="nofollow" title="Search-results Home Page [new window]" target="_blank">Search-results</a>',
-'holasearch', '<a href="http://www.holasearch.com" rel="nofollow" title="Hola Search Home Page [new window]" target="_blank">Hola Search</a>',
-'conduit', '<a href="http://search.conduit.com" rel="nofollow" title="Conduit Search Home Page [new window]" target="_blank">Conduit Search</a>',
-'flipora', '<a href="http://static.flipora.com/" rel="nofollow" title="Flipora Home Page [new window]" target="_blank">Flipora</a>',
-'delta-search', '<a href="http://www.delta-search.com/" rel="nofollow" title="Delta Search Home Page [new window]" target="_blank">Delta Search</a>',
-'iminent', '<a href="http://start.iminent.com/" rel="nofollow" title="Iminent Home Page [new window]" target="_blank">Iminent</a>',
-'searchmobileonline', '<a href="http://www.searchmobileonline.com/" rel="nofollow" title="Search Mobile Online (StartApp) Home Page [new window]" target="_blank">Search Mobile Online (StartApp)</a>',
-'nortonsavesearch', '<a href="http://int.search-results.com/" rel="nofollow" title="Norton Safe Search Home Page [new window]" target="_blank">Norton Safe Search</a>',
-'inbox', '<a href="http://www2.inbox.com/search/results1.aspx" rel="nofollow" title="Inbox Search [new window]" target="_blank">Inbox Search</a>',
-'govome', '<a href="http://www.govome.com/" rel="nofollow" title="Govome [new window]" target="_blank">Govome</a>',
-'find1friend', '<a href="http://find1friend.com/" rel="nofollow" title="Find1Friend [new window]" target="_blank">Find1Friend</a>',
-'mysearchdial', '<a href="http://start.mysearchdial.com/" rel="nofollow" title="My Search Dial [new window]" target="_blank">My Search Dial</a>',
-'speedbit', '<a href="http://go.speedbit.com/" rel="nofollow" title="Speedbit [new window]" target="_blank">Speedbit</a>',
-'certifiedtoolbarsearch', '<a href="http://search.certified-toolbar.com/" rel="nofollow" title="Certified-Toolbar Search [new window]" target="_blank">Certified-Toolbar Search</a>',
-'sweetim', '<a href="http://search.sweetim.com/" rel="nofollow" title="SweetIM Search [new window]" target="_blank">SweetIM Search</a>',
-'searchcompletion', '<a href="http://search.searchcompletion.com/" rel="nofollow" title="SearchCompletion Search [new window]" target="_blank">SearchCompletion Search</a>',
-'eazelsearch', '<a href="http://en.eazel.com/" rel="nofollow" title="Eazel Search [new window]" target="_blank">Eazel Search</a>',
-'searchfunmoods', '<a href="http://sr.searchfunmoods.com/" rel="nofollow" title="Funmoods [new window]" target="_blank">Funmoods</a>',
-'googleByIP', '<a href="http://173.194.35.177/" rel="nofollow" title="Google (Access by IP-Address) [new window]" target="_blank">Google (Access by IP-Address)</a>',
-'dalesearch',  '<a href="http://www.dalesearch.com/" rel="nofollow" title="Dale Search [new window]" target="_blank">Dale Search</a>',
-'sweetpacks', '<a href="http://www.sweetpacks-search.com/" rel="nofollow" title="Sweetpacks [new window]" target="_blank">Sweetpacks</a>',
-'searchgol', '<a href="http://www.searchgol.com/" rel="nofollow" title="Search-Gol [new window]" target="_blank">Search-Gol</a>',
-'duckduckgo',  '<a href="http://r.duckduckgo.com/" rel="nofollow" title="DuckDuckGo Home Page [new window]" target="_blank">DuckDuckGo (Does not provide search keyphrases, using found page instead)</a>',
-'facemoods', '<a href="http://sr.facemoods.com/" rel="nofollow" title="Facemoods Search [new window]" target="_blank">Facemoods Search</a>',
-'shoppstop', '<a href="http://www.shoppstop.com/" rel="nofollow" title="ShoppStop [new window]" target="_blank">ShoppStop</a>',
-'searchya', '<a href="http://www.searchya.com/" rel="nofollow" title="Searchya [new window]" target="_blank">Searchya</a>',
-'picsearch', '<a href="http://www.picsearch.de/" rel="nofollow" title="picsearch [new window]" target="_blank">picsearch</a>',
-'webssearches', 'Various variants of Webssearches <a href="http://www.webssearches.com/" rel="nofollow" title="Webssearches [new window]" target="_blank">EMG Technologies</a> and <a href="http://airzip.inspsearch.com/" rel="nofollow" title="airzip.inspsearch.com [new window]" target="_blank">airzip.inspsearch.com</a>',
-#Jan 8, 2016: No genuine inspsearch.com search engine seems to exist, but there are a couple of search engines using subdomains of inspsearch.com. Unclear how these are related to each other.
-'zapmeta', '<a href="http://www.zapmeta.de/" rel="nofollow" title="ZapMeta [new window]" target="_blank">ZapMeta</a>',
-'localmoxie', '<a href="http://www.localmoxie.com/" rel="nofollow" title="Local Moxie [new window]" target="_blank">Local Moxie</a>',
-'search-results_mobi', '<a href="http://search-results.mobi/" rel="nofollow" title="search-results.mobi [new window]" target="_blank">search-results.mobi</a>',
-'androidsearch', '<a href="http://www.androidsearch.com/" rel="nofollow" title="androidsearch.com [new window]" target="_blank">androidsearch.com</a>',
-'isearch_nation_com', '<a href="http://isearch.nation.com/" rel="nofollow" title="Nation Search [new window]" target="_blank">Nation Search</a>',
-'search_zonealarm_com', '<a href="http://search.zonealarm.com/" rel="nofollow" title="Zone Alarm Search [new window]" target="_blank">Zone Alarm Search</a>',
-'www_buenosearch_com', '<a href="http://www.buenosearch.com/" rel="nofollow" title="BuenoSearch [new window]" target="_blank">BuenoSearch</a>',
-'search_foxtab_com',  '<a href="http://search.foxtab.com/" rel="nofollow" title="Foxtab Search [new window]" target="_blank">Foxtab Search</a>',
-'searches_qone8_com', '<a href="http://searches.qone8.com/" rel="nofollow" title="Omiga-Plus [new window]" target="_blank">Omiga-Plus</a>',
-'startpage_com', '<a href="http://startpage.com/" rel="nofollow" title="Startpage [new window]" target="_blank">Startpage</a>',
-'qwant_com', '<a href="https://www.qwant.com/" rel="nofollow" title="qwant.com [new window]" target="_blank">qwant.com</a>',
-'safehomepage_com', '<a href="http://searches.safehomepage.com/" rel="nofollow" title="safehomepage.com [new window]" target="_blank">safehomepage.com</a>',
-'vi-view_com', '<a href="http://searches.vi-view.com/" rel="nofollow" title="vi-view.com [new window]" target="_blank">vi-view.com</a>',
-'wow_utop_it', '<a href="http://wow.utop.it/" rel="nofollow" title="wow.utop.it [new window]" target="_blank">wow.utop.it</a>',
-'windowssearch_com', '<a href="http://www.windowssearch.com/search?q=AWStats" rel="nofollow" title="Example page [new window]" target="_blank">windowssearch.com</a>',
-'www_wow_com', '<a href="http://www.wow.com/" rel="nofollow" title="www.wow.com [new window]" target="_blank">WOW.com</a>',
-'globososo', 'Various variants of Globososo (Kingtale Technology): <a href="http://www.globososo.com/" rel="nofollow" title="Globososo search page [new window]" target="_blank">www</a>, <a href="http://searches.globososo.com/" rel="nofollow" title="searches subdomain of globososo.com [new window]" target="_blank">searches</a>, <a href="http://searches3.globososo.com/" rel="nofollow" title="searches3 subdomain of globososo.com [new window]" target="_blank">searches3</a>, and at inspsearch.com (<a href="http://globososo.inspsearch.com/" rel="nofollow" title="Globososo search page at globososo.inspsearch.com [new window]" target="_blank">globososo</a>, <a href="http://kingtale3.inspsearch.com/" rel="nofollow" title="Globososo search page at kingtale3.inspsearch.com [new window]" target="_blank">kingtale3</a>)',
-'swisscows_ch', '<a href="https://swisscows.ch/" rel="nofollow" title="Swisscows search page [new window]" target="_blank">Swisscows</a>',
-'preciobarato_xyz', '<a href="http://preciobarato.xyz/" rel="nofollow" title="preciobarato.xyz offline on Oct 2, 2015 [new window]" target="_blank">Yandex</a>',
-'www_dregol_com', '<a href="http://www.dregol.com/" rel="nofollow" title="Dregol Search [new window]" target="_blank">Dregol Search</a>',
-'search_socialdownloadr_com', '<a href="http://search.socialdownloadr.com/" rel="nofollow" title="Socialdownloadr search page [new window]" target="_blank">Socialdownloadr</a>',
-'int_search_myway_com', '<a href="http://int.search.myway.com/" rel="nofollow" title="MyWay search page [new window]" target="_blank">MyWay</a>',
-'de_dolphin_com', '<a href="http://de.dolphin.com/" rel="nofollow" title="Dolphin Search search page [new window]" target="_blank">Dolphin Search</a>',
-'mys_yoursearch_me', '<a href="http://mys.yoursearch.me/" rel="nofollow" title="Yoursearch.me search page [new window]" target="_blank">Yoursearch.me</a>',
-# Chello Portals
-'chelloat','<a href="http://www.chello.at/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Austria</a>',
-'chellobe','<a href="http://www.chello.be/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Belgium</a>',
-'chellocz','<a href="http://www.chello.cz/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Czech Republic</a>',
-'chellofr','<a href="http://www.chello.fr/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello France</a>',
-'chellohu','<a href="http://www.chello.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Hungary</a>',
-'chellonl','<a href="http://www.chello.nl/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Netherlands</a>',
-'chellono','<a href="http://www.chello.no/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Norway</a>',
-'chellopl','<a href="http://www.chello.pl/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Poland</a>',
-'chellose','<a href="http://www.chello.se/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Sweden</a>',
-'chellosk','<a href="http://www.chello.sk/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello Slovakia</a>',
-'chellocom','<a href="http://www.chello.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Chello (Country not recognized)</a>',
-# Mirago
-'miragobe','<a href="http://www.mirago.be/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Belgium</a>',
-'miragoch','<a href="http://www.mirago.ch/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Switzerland</a>',
-'miragode','<a href="http://www.mirago.de/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Germany</a>',
-'miragodk','<a href="http://www.mirago.dk/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Denmark</a>',
-'miragoes','<a href="http://es.mirago.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Spain</a>',
-'miragofr','<a href="http://www.mirago.fr/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago France</a>',
-'miragoit','<a href="http://www.mirago.it/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Italy</a>',
-'miragonl','<a href="http://www.mirago.nl/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Netherlands</a>',
-'miragono','<a href="http://no.mirago.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Norway</a>',
-'miragose','<a href="http://www.mirago.se/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago Sweden</a>',
-'miragocouk','<a href="http://zone.mirago.co.uk/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago UK</a>',
-'mirago','<a href="http://www.mirago.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mirago (country unknown)</a>',
-'answerbus','<a href="http://www.answerbus.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Answerbus</a>',
-'icq','<a href="http://www.icq.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">icq</a>',
-'nusearch','<a href="http://www.nusearch.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Nusearch</a>',
-'goodsearch','<a href="http://www.goodsearch.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">GoodSearch</a>',
-'scroogle','<a href="http://www.scroogle.org/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Scroogle</a>',
-'questionanswering','<a href="http://www.questionanswering.com/" rel="nofollow" title="Questionanswering home page [new window]" target="_blank">Questionanswering</a>',
-'mywebsearch','<a href="http://search.mywebsearch.com/" rel="nofollow" title="MyWebSearch home page [new window]" target="_blank">MyWebSearch</a>',
-'comettoolbar','<a href="http://as.starware.com/dp/search" rel="nofollow" title="Comet toolbar search home page [new window]" target="_blank">Comet toolbar search</a>',
-# Social Bookmarking Services
-'delicious','<a href="http://del.icio.us/" rel="nofollow" title="del.icio.us home page [new window]" target="_blank">del.icio.us</a> (Social Bookmark)',
-'digg','<a href="http://www.digg.com/" rel="nofollow" title="Digg home page [new window]" target="_blank">Digg</a> (Social Bookmark)',
-'stumbleupon','<a href="http://www.stumbleupon.com/" rel="nofollow" title="Stumbleupon home page [new window]" target="_blank">Stumbleupon</a> (Social Bookmark)',
-'swik','<a href="http://swik.net/" rel="nofollow" title="Swik home page [new window]" target="_blank">Swik</a> (Social Bookmark)',
-'segnalo','<a href="http://segnalo.alice.it/" rel="nofollow" title="Segnalo home page [new window]" target="_blank">Segnalo</a> (Social Bookmark)',
-'ineffabile','<a href="http://www.ineffabile.it/" rel="nofollow" title="Ineffabile.it home page [new window]" target="_blank">Ineffabile.it</a> (Social Bookmark)',
-# Minor Australian search engines
-'anzwers','<a href="http://anzwers.com.au/" rel="nofollow" title="anzwers.com.au home page [new window]" target="_blank">anzwers.com.au</a>',
-# Minor brazilian search engines
-'engine','Cade', 'miner','Meta Miner',
-# Minor chinese search engines
-'baidu','<a href="http://www.baidu.com/" rel="nofollow" target="_blank">Baidu</a>',
-'iask','<a href="http://www.iask.com/" rel="nofollow" target="_blank">Iask</a>',
-'accoona','<a href="http://cn.accoona.com" rel="nofollow" target="_blank">Accoona</a>',
-'3721','<a href="http://www.3721.com/" rel="nofollow" target="_blank">3721</a>',
-'netease', '<a href="http://www.163.com/" rel="nofollow" target="_blank">NetEase</a>',
-'soso','<a href="http://www.soso.com/" rel="nofollow" target="_blank">SoSo</a>',
-'zhongsou','<a href="http://www.zhongsou.com/" rel="nofollow" target="_blank">ZhongSou</a>',
-'sogou', '<a href="http://www.sogou.com/" rel="nofollow" target="_blank">SoGou</a>',
-'vnet','<a href="http://114.vnet.cn/" rel="nofollow" target="_blank">VNet</a>',
-# Minor czech search engines
-'atlas','Atlas.cz',    'seznam','Seznam', 'quick','Quick.cz', 'centrum','Centrum.cz', 'jyxo','Jyxo.cz', 'najdi','Najdi.to', 'redbox','RedBox.cz',
-'avgsearch', '<a href="http://isearch.avg.com" rel="nofollow" target="_blank">AVG Secure Search</a>',
-# Minor danish search-engines
-'opasia','Opasia', 'danielsen','Thor (danielsen.com)', 'sol','SOL', 'jubii','Jubii', 'finddk','Find', 'edderkoppen','Edderkoppen', 'netstjernen','Netstjernen', 'orbis','Orbis', 'tyfon','Tyfon', '1klik','1Klik', 'ofir','Ofir',
-# Minor dutch search engines
-'ilse','Ilse','vindex','Vindex\.nl',
-# Minor english search engines
-'askuk','<a href="http://uk.ask.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask UK</a>',
-'bbc','BBC', 'freeserve','Freeserve', 'looksmartuk','Looksmart UK',
-'splut','Splut', 'spotjockey','Spotjockey', 'ukdirectory','UK Directory', 'ukindex','UKIndex', 'ukplus','UK Plus', 'searchy','searchy.co.uk',
-'fbdownloader','<a href="http://search.fbdownloader.com/" rel="nofollow" title="FBDownloader Home Page [new window]" target="_blank">FBDownloader (fbdownloader)</a>',
-'fdownloadr_com', '<a href="http://search.fdownloadr.com/" rel="nofollow" title="FBDownloader Home Page [new window]" target="_blank">FBDownloader (fdownloadr)</a>',
-'babylon','<a href="http://search.babylon.com/" rel="nofollow" title="Babylon Home Page [new window]" target="_blank">Babylon</a>',
-'allgameshome', '<a href="http://my.allgameshome.com/" rel="nofollow" title="AllGamesHome [new window]" target="_blank">AllGamesHome</a>',
-'surfcanyon_com', '<a href="http://search.surfcanyon.com/" rel="nofollow" title="SurfCanyon [new window]" target="_blank">SurfCanyon</a>',
-'uk_foxstart_com', '<a href="http://uk.foxstart.com/" rel="nofollow" title="Foxstart search page [new window]" target="_blank">Foxstart.com</a>',
-'yandex_com', '<a href="http://yandex.com/" rel="nofollow" title="Yandex search page [new window]" target="_blank">Yandex</a>',
-# Minor finnish search engines
-'haku','Ihmemaa',
-# Minor french search engines
-'aolfr','AOL (fr)', 'ctrouve','C\'est trouve', 'francite','Francite', 'lbb', 'LBB', 'libertysurf', 'Libertysurf', 'free', 'Free.fr', 'clubinternet', 'Club-internet',
-'toile', 'Toile du Quebec',
-'biglotron','<a href="http://www.biglotron.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Biglotron</a>',
-'mozbot','<a href="http://www.mozbot.fr/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Mozbot</a>',
-# Minor German search engines
-'aolde','AOL (de)',
-'o2aolde', '<a href="http://o2suche.aol.de/aol/search" rel="nofollow" title="o2 Suche Home Page [new window]" target="_blank">o2 Suche</a>',
-'fireball','Fireball', 'infoseek','Infoseek',
-'webde','<a href="http://suche.web.de" rel="nofollow" title="Web.de Home Page [new window]" target="_blank">Web.de</a>',
-'abacho','Abacho',
-'t-online','T-Online',
-'allesklar','allesklar.de', 'meinestadt','meinestadt.de',
-'metaspinner','metaspinner',
-'metacrawler_de','metacrawler.de',
-'wwweasel','<a href="http://wwweasel.de/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">WWWeasel</a>',
-'netluchs','<a href="http://www.netluchs.de/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Netluchs</a>',
-'schoenerbrausen','<a href="http://www.schoenerbrausen.de/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Schoenerbrausen/</a>',
-'gmxsuche', '<a href="http://suche.gmx.net/" rel="nofollow" title="GMX Suche Home Page [new window]" target="_blank">GMX Suche</a>',
-'gmxsuche_at', '<a href="http://suche.gmx.at/" rel="nofollow" title="GMX Suche Oesterreich Home Page [new window]" target="_blank">GMX Suche Oesterreich</a>',
-'ecosiasearch', '<a href="http://ecosia.org" rel="nofollow" title="Ecosia Search Home Page [new window]" target="_blank">Ecosia Search</a>',
-'aolsearch', '<a href="http://de.aolsearch.com/" rel="nofollow" title="AOL Search Home Page [new window]" target="_blank">AOL Search</a>',
-'aolsuche', '<a href="http://suche.aol.de/" rel="nofollow" title="AOL Suche Home Page [new window]" target="_blank">AOL Suche</a>',
-'startxxl', '<a href="http://www.startxxl.com/" rel="nofollow" title="StartXXL Home Page [new window]" target="_blank">StartXXL</a>',
-'benefind', '<a href="http://www.benefind.de/" rel="nofollow" title="benefind Home Page [new window]" target="_blank">benefind</a>',
-'amazonsearch', '<a href="http://www.amazon.de/gp/bit/apps/web/SERP/search/" rel="nofollow" title="Amazon Web Search Home Page [new window]" target="_blank">Amazon Web Search</a>',
-'wowsearch', '<a href="http://de.wow.com/" rel="nofollow" title="Wow Search Home Page [new window]" target="_blank">Wow Search</a>',
-'vlips_de', '<a href="http://www.vlips.de/semags_proxy.php" rel="nofollow" title="vlips Proxy Page (Homepage not yet ready?) [new window]" target="_blank">vlips.de</a>',
-'metager', '<a href="http://www.metager.de" rel="nofollow" title="MetaGer Home Page [new window]" target="_blank">MetaGer</a>',
-'search_1und1_de', '<a href="http://search.1und1.de/" rel="nofollow" title="1&amp;1 Suche [new window]" target="_blank">1&amp;1 Suche (subdomain "search")</a>',
-'smde', '<a href="http://www.sm.de/" rel="nofollow" title="SM.de - Die SuchMaschine [new window]" target="_blank">SM.de - Die SuchMaschine</a>',
-'sumaja',  '<a href="http://www.sumaja.de/" rel="nofollow" title="Sumaja [new window]" target="_blank">Sumaja</a>',
-'navigationshilfe', '<a href="http://navigationshilfe.t-online.de/" rel="nofollow" title="T-Online Navigationshilfe [new window]" target="_blank">T-Online Navigationshilfe</a>',
-'umfis', '<a href="http://www.umfis.de/" rel="nofollow" title="UMFIS-Online Das Umweltfirmen-Informationssystem der IHKs in Deutschland [new window]" target="_blank">UMFIS-Online Das Umweltfirmen-Informationssystem der IHKs in Deutschland</a>',
-'fastbot_de', '<a href="http://fastbot.de/" rel="nofollow" title="Fastbot.de [new window]" target="_blank">Fastbot.de (Does not provide search keyphrases, using found page instead)</a>',
-'tixuma_de', '<a href="http://www.tixuma.de/" rel="nofollow" title="Tixuma Deutschland [new window]" target="_blank">Tixuma Deutschland</a>',
-'freenet_de', '<a href="http://suche.freenet.de/" rel="nofollow" title="suche.freenet.de [new window]" target="_blank">suche.freenet.de</a>',
-'izito_de',  '<a href="http://www.izito.de/" rel="nofollow" title="iZito Deutschland [new window]" target="_blank">iZito Deutschland</a>',
-'peoplecheck_de', '<a href="http://peoplecheck.de/" rel="nofollow" title="PeopleCheck.de [new window]" target="_blank">PeopleCheck.de</a>',
-'oneseek_de', '<a href="http://www.oneseek.de" rel="nofollow" title="Metasuchmaschine OneSeek.de [new window]" target="_blank">Metasuchmaschine OneSeek.de</a>',
-'de_wiki_gov_cn', '<a href="http://de.wiki.gov.cn/" rel="nofollow" title="Wiki Sucher [new window]" target="_blank">Wiki Sucher</a>',
-'umuwa_de', '<a href="http://umuwa.de/" rel="nofollow" title="Umuwa Deutschland [new window]" target="_blank">Umuwa Deutschland</a>',
-'1und1_de', '<a href="http://suche.1und1.de/" rel="nofollow" title="1&amp;1 Suche [new window]" target="_blank">1&amp;1 Suche (subdomain "suche")</a>',
-'metasuche_ch', '<a href="http://www.metasuche.ch/" rel="nofollow" title="Metasuche search page [new window]" target="_blank">Metasuche.ch</a>',
-# Minor hungarian search engines
-'heureka','Heureka', 'origo','Origo-Vizsla', 'lapkereso','Startlapkereso', 'goliat','Goliat', 'indexhu','Index', 'wahoo','Wahoo', 'webmania','webmania.hu', 'internetto','Internetto Kereso',
-'tango_hu','<a href="http://tango.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Tango</a>',
-'keresolap_hu','<a href="http://keresolap.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Tango keresolap</a>',
-'startlap_hu','<a href="http://kereso.startlap.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Startlab Kereso</a>',
-'polymeta_hu','<a href="http://www.polymeta.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Polymeta</a>',
-# Minor Indian search engines
-'sify','<a href="http://search.sify.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Sify</a>',
-# Minor Italian search engines
-'virgilio','<a href="http://www.virgilio.it/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Virgilio</a>',
-'arianna','<a href="http://arianna.libero.it/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Arianna</a>',
-'supereva','<a href="http://search.supereva.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Supereva</a>',
-'kataweb','<a href="http://www.kataweb.it/ricerca/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Kataweb</a>',
-'aliceitmaster','<a href="http://www.alice.it/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">search.alice.it.master</a>',
-'aliceit','<a href="http://www.alice.it/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">alice.it</a>',
-'gotuneed','<a href="http://www.gotuneed.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">got u need</a>',
-'godado','Godado.it',
-'jumpy\.it','Jumpy.it',
-'shinyseek\.it','Shinyseek.it',
-'teecnoit','<a href="http://www.teecno.it/" rel="nofollow" title="Teecno home page [new window]" target="_blank">Teecno</a>',
-# Minor Israeli search engines
-'genieo','<a href="http://search.genieo.com/" rel="nofollow" title="Genieo home page [new window]" target="_blank">Genieo</a>',
-# Minor Japanese search engines
-'askjp','<a href="http://www.ask.jp/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Ask Japan</a>',
-'sagool','<a href="http://sagool.jp/" rel="nofollow" title="Sagool home page [new window]" target="_blank">Sagool</a>',
-'rakuten', '<a href="http://websearch.rakuten.co.jp" rel="nofollow" title="websearch.rakuten.co.jp [new window]" target="_blank">websearch.rakuten.co.jp</a>',
-# Minor Norwegian search engines
-'start','start.no', 'eniro','<a href="http://www.eniro.no/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Eniro</a>',
-# Minor polish search engines
-'wp','<a href="http://szukaj.wp.pl/" rel="nofollow" title="Wirtualna Polska home page [new window]" target="_blank">Wirtualna Polska</a>',
-'onetpl','<a href="http://szukaj.onet.pl/" rel="nofollow" title="Onet.pl home page [new window]" target="_blank">Onet.pl</a>',
-'dodajpl','<a href="http://www.dodaj.pl/" rel="nofollow" title="Dodaj.pl home page [new window]" target="_blank">Dodaj.pl</a>',
-'gazetapl','<a href="http://szukaj.gazeta.pl/" rel="nofollow" title="Gazeta.pl home page [new window]" target="_blank">Gazeta.pl</a>',
-'gerypl','<a href="http://szukaj.gery.pl/" rel="nofollow" title="Gery.pl home page [new window]" target="_blank">Gery.pl</a>',
-'hogapl','<a href="http://www.hoga.pl/" rel="nofollow" title="Hoga.pl home page [new window]" target="_blank">Hoga.pl</a>',
-'netsprintpl','<a href="http://www.netsprint.pl/" rel="nofollow" title="NetSprint.pl home page [new window]" target="_blank">NetSprint.pl</a>',
-'interiapl','<a href="http://www.google.interia.pl/" rel="nofollow" title="Interia.pl home page [new window]" target="_blank">Interia.pl</a>',
-'katalogonetpl','<a href="http://katalog.onet.pl/" rel="nofollow" title="Katalog.Onet.pl home page [new window]" target="_blank">Katalog.Onet.pl</a>',
-'o2pl','<a href="http://szukaj2.o2.pl/" rel="nofollow" title="o2.pl home page [new window]" target="_blank">o2.pl</a>',
-'polskapl','<a href="http://szukaj.polska.pl/" rel="nofollow" title="Polska home page [new window]" target="_blank">Polska</a>',
-'szukaczpl','<a href="http://www.szukacz.pl/" rel="nofollow" title="Szukacz home page [new window]" target="_blank">Szukacz</a>',
-'wowpl','<a href="http://szukaj.wow.pl/" rel="nofollow" title="Wow.pl home page [new window]" target="_blank">Wow.pl</a>',
-# Minor russian search engines
-'yandex', 'Yandex', 'aport', 'Aport', 'rambler', 'Rambler', 'turtle', 'Turtle', 'metabot', 'MetaBot',
-'mailru','<a href="http://go.mail.ru/" rel="nofollow" title="Mail.Ru home page [new window]" target="_blank">Mail.Ru</a>',
-# Minor Swedish search engines
-'passagen','Evreka',
-'enirose','<a href="http://www.eniro.se/" rel="nofollow" title="Eniro Sverige home page [new window]" target="_blank">Eniro Sverige</a>',
-# Minor Slovak search engines
-'zoznam','<a href="http://www.zoznam.sk/" rel="nofollow" title="Zoznam search engine home page [new window]" target="_blank">Zoznam</a>',
-# Minor Portuguese search engines
-'sapo','<a href="http://www.sapo.pt/" rel="nofollow" title="Sapo search engine home page [new window]" target="_blank">Sapo</a>',
-# Minor Swiss search engines
-'searchch', 'search.ch', 'bluewin', 'search.bluewin.ch',
-'zapmeta_ch', '<a href="http://www.zapmeta.ch/" rel="nofollow" title="ZapMeta.ch [new window]" target="_blank">ZapMeta.ch</a>',
-'etools_ch', '<a href="http://www.etools.ch/" rel="nofollow" title="eTools.ch [new window]" target="_blank">eTools.ch</a>',
-# Minor Croatian, Serbian, Macedonian, Bosnian and Herzegovinian search engines
-'pogodak','<a href="http://www.pogodak.com" rel="nofollow" title="Pogodak search engine home page [new window]" target="_blank">Pogodak.com</a>',
-# Generic search engines
-'search','Unknown search engines'
-);
-
-
-# Sanity check.
-# Enable this code and run perl search_engines.pm to check file entries are ok
-#-----------------------------------------------------------------------------
-#foreach my $key (@SearchEnginesSearchIDOrder_list1) {
-#      if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_list1 with no value in SearchEnginesHashID");
-#      foreach my $key2 (@SearchEnginesSearchIDOrder_list2) { if ($key2 eq $key) { error("$key is in 1 and 2\n"); } }
-#      foreach my $key2 (@SearchEnginesSearchIDOrder_listgen) { if ($key2 eq $key) { error("$key is in 1 and gen\n"); } }
-#} }
-#foreach my $key (@SearchEnginesSearchIDOrder_list2) {
-#      if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_list2 with no value in SearchEnginesHashID");
-#      foreach my $key2 (@SearchEnginesSearchIDOrder_list1) { if ($key2 eq $key) { error("$key is in 2 and 1\n"); } }
-#      foreach my $key2 (@SearchEnginesSearchIDOrder_listgen) { if ($key2 eq $key) { error("$key is in 2 and gen\n"); } }
-#} }
-#foreach my $key (@SearchEnginesSearchIDOrder_listgen) { if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_listgen with no value in SearchEnginesHashID"); } }
-#foreach my $key (keys %NotSearchEnginesKeys) { if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in NotSearchEnginesKeys with no value in SearchEnginesHashID"); } }
-#foreach my $key (keys %SearchEnginesKnownUrl) {
-#      my $found=0;
-#      foreach my $key2 (values %SearchEnginesHashID) {
-#              if ($key eq $key2) { $found=1; last; }
-#      }
-#      if (! $found) { die "Entry '$key' has been found in SearchEnginesKnownUrl with no value in SearchEnginesHashID"; }
-#}
-#foreach my $key (keys %SearchEnginesHashLib) {
-#      my $found=0;
-#      foreach my $key2 (values %SearchEnginesHashID) {
-#              if ($key eq $key2) { $found=1; last; }
-#      }
-#      if (! $found) { die "Entry '$key' has been found in SearchEnginesHashLib with no value in SearchEnginesHashID"; }
-#}
-#print @SearchEnginesSearchIDOrder_list1." ".@SearchEnginesSearchIDOrder_list2." ".@SearchEnginesSearchIDOrder_listgen;
-
-1;
+# AWSTATS SEARCH ENGINES DATABASE\r
+#------------------------------------------------------------------------------\r
+# If you want to add a Search Engine to extend AWStats database detection capabilities,\r
+# you must add an entry in SearchEnginesSearchIDOrder, SearchEnginesHashID and in\r
+# SearchEnginesHashLib.\r
+# An entry if known in SearchEnginesKnownUrl is also welcome.\r
+#\r
+# to eldy: Please check if the following description is correct:\r
+# You need the following information to specify a search engine:\r
+# (a) A regular expression that matches the referrer string of the\r
+#    search engine. Unclear: What about slashes in the name of\r
+#    a search engine, e.g. as in 'ecosia.com/search'? It seems that\r
+#    AWStats will not find search strings containing a slash.\r
+#    Maybe use a search string without a slash, and - if necessary -\r
+#    an entry in %NotSearchEnginesKeys , if this search string\r
+#    matches entries that are not search engines.\r
+#    Example of a web address of an Amazon search engine:\r
+#    http://www.amazon.de/gp/bit/apps/web/SERP/search/ref=bit_bds-p24_serp_cr_de?ie=UTF8tagbase=bds-p24&query=deutsch+8.+klasse+gymnasium+protokoll\r
+# (b) A unique string to identify the search engine within AWStats\r
+# (c) A regular expression that finds the start of the query part in the\r
+#    referrer string\r
+# (d) An HTML fragment that goes into the reports generated by AWStats which\r
+#    identifies the search engine to the human reader of the report. In the\r
+#    simplest case this is a string containing the name of the search\r
+#    engine. You can also provide a hypertext clause that presents the\r
+#    name together with a link to the search engine.\r
+#\r
+# The regular expression (a) goes into SearchEnginesSearchIDOrder_list1\r
+# or ..._list2. List 1 contains common search engines, list 2 those\r
+# that are not so often used.\r
+#\r
+# SearchEnginesHashID contains two consecutive entries for each search\r
+# engine: The regular expression (a) followed by the search engine\r
+# identifier (b).\r
+#\r
+# SearchEnginesKnownUrl specifies how to find the start of the query.\r
+# For each search engine you enter the search engine identifier (b)\r
+# followed by the regular expression (c). Unclear: It is possible to\r
+# omit this entry. If you do this, how will AWStats find the start of\r
+# the query?\r
+#\r
+# SearchEnginesHashLib contains also two entries for each search engine:\r
+# The search engine identifier (b) followed by the HTML-Fragment (d)\r
+#\r
+# There are search engines that do not use a query part in their URLs.\r
+# They put the search expression in the main part of the URL instead.\r
+# AWStats is able to handle these cases. They are specified as described\r
+# above, except the following two things:\r
+# - The regular expression (c) searches the complete URL and not only\r
+#   the query part.\r
+# - An additional Entry in the list %SearchEnginesWithKeysNotInQuery is\r
+#   necessary.\r
+#\r
+#\r
+# AWStats runs a sanity check of the contents of search_engines.pm. This\r
+# check detects the following things:\r
+# - Inconsistencies (number of entries)\r
+# It does not detect the following errors:\r
+# - If the HTML-Fragment (d) is syntactically incorrect.\r
+#\r
+#------------------------------------------------------------------------------\r
+\r
+# 2005-08-19 Sean Carlos http://www.antezeta.com/awstats.html\r
+#            added minor italian search engines\r
+#                  arianna http://arianna.libero.it/\r
+#                  supereva http://search.supereva.com/\r
+#                  kataweb http://kataweb.it/\r
+#            corrected uk looksmart\r
+#                  'askuk','ask=', 'bbc','q=', 'freeserve','q=', 'looksmart','key=',\r
+#            to\r
+#                  'askuk','ask=', 'bbc','q=', 'freeserve','q=', 'looksmartuk','key=',\r
+#            corrected spelling\r
+#                     internationnal -> international\r
+#            added 'google\.'=>'mail\.google\.', to NotSearchEnginesKeys in order to\r
+#            avoid counting gmail referrals as search engine traffic\r
+# 2005-08-21 Sean Carlos http://www.antezeta.com/awstats.html\r
+#            avoid counting babelfish.altavista referrals as search engine traffic\r
+#            avoid counting translate.google referrals as search engine traffic\r
+# 2005-11-20 Sean Carlos\r
+#           added missing 'tiscali','key=', entry.  Check order\r
+# 2005-11-22 Sean Carlos\r
+#           added Google Base & Froogle.  Froogle not tested.\r
+# 2006-04-18 Sean Carlos http://www.antezeta.com/awstats.html\r
+#           added biglotron.com (France)\r
+#           added blingo http://www.blingo.com/\r
+#           added Clusty & Vivisimo\r
+#           added eniro.no (Norway) [https://sourceforge.net/forum/message.php?msg_id=3134783]\r
+#           added GPU p2p search http://search.centraldatabase.org/\r
+#           added mail.tiscali to "not search engines list" [https://sourceforge.net/forum/message.php?msg_id=3166688]\r
+#           added Ask group's "mysearch"\r
+#           added sify.com (India)\r
+#           added sogou.com (China) [https://sourceforge.net/forum/message.php?msg_id=3501603]\r
+#           Ask changes:\r
+#           - added Ask Japan (ask.jp)\r
+#           - break out Ask new country level variants (DE, ES, FR, IT, NL)\r
+#           - updated Ask name from Ask Jeeves\r
+#           - added Ask q= parameter - many recent searches probably not recognized; [https://sourceforge.net/forum/message.php?msg_id=3465444]\r
+#           - updated Ask uk (new uk.ask.com added to older ask.co.uk)\r
+#           updated voila kw|rdata parameter [https://sourceforge.net/forum/message.php?msg_id=3373912]\r
+#           for each new engine, added link to Search Engine.  This serves to document engine. Done for major & Italian engines as well. Requires patch\r
+#              to AWStats to allow untranslated html.  Otherwise html will appear instead of link.\r
+#           reviewed mnoGoSearch (http://www.mnogosearch.org/); the search engine mentioned no longer\r
+#              exists https://sourceforge.net/forum/message.php?msg_id=3025426\r
+# 2006-05-13 Sean Carlos http://www.antezeta.com/awstats.html\r
+#            added 10 Chello European broadband portals (Austria, Belgium, Czech Republic, France, Hungary, The Netherlands, Norway, Poland, Slovakia, Sweden)\r
+#           added Alice Internal Search (blends data with Google?) search.alice.it.master:10005\r
+#            added detection of google cache views from IPs 66.249.93.104 72.14.203.104 72.14.207.104\r
+#              To do: add more extensive IP list; keywords not yet detected.\r
+#            added icerocket.com blog search http://www.icerocket.com/\r
+#           added live.com (msn) http://www.live.com/\r
+#           added Meta motor kartoo.  Note: Kartoo does not provide search words in referrers, thus the engine will appear in the\r
+#              search engine list but the actual search words are not available.\r
+#           added netluchs.de http://www.netluchs.de/\r
+#           added sphere.com blog search http://www.sphere.com/\r
+#           added wwweasel.de http://wwweasel.de\r
+#           added Yahoo Mindset! http://mindset.research.yahoo.com/\r
+#            updated Mirago query parameter recognition (qry=); added breakout for each country (France, Germany, Spain, Italy, Norway, Sweden, Denmark, Netherlands, Belgium, Switzerland)\r
+# 2006-05-13 Sean Carlos http://www.antezeta.com/awstats.html\r
+#           added Google cache IPs 64.233.183.104 & 66.102.7.104\r
+# 2006-05-20 Sean Carlos http://www.antezeta.com/awstats.html\r
+#              anzwers.com.au\r
+#              schoenerbrausen.de http://www.schoenerbrausen.de/\r
+#              added Google cache IP 216.239.59.104\r
+#              answerbus http://www.answerbus.com/ (does not provide keywords)\r
+# 2006-05-23 Sean Carlos http://www.antezeta.com/awstats.html\r
+#              added Google cache IP 66.102.9.104, 64.233.161.104\r
+# 2006-06-23 Sean Carlos http://www.antezeta.com/awstats.html\r
+#              added Alice Search search.alice.it\r
+#              added GoodSearch http://www.goodsearch.com/ (does not provide keywords) "a Yahoo-powered search engine that donates money to your favorite charity or school each time you search the web"\r
+#              added googlee.com, variant of Google\r
+#              added gotuneed http://www.gotuneed.com/ Italian search engine, in beta\r
+#              added icq.com\r
+#              added logic to parse Google Cache search keywords. Seems to work for alpha but not numeric cache IDs, i.e. search?q=cache:lWVLmnuGJswJ: is recognized but q=cache:Yv5qxeJNuhgJ: is not recognized. The URL triggering the keywords will also appear.  The URLs are probably too varied to parse out?\r
+#              added Nusearch http://www.nusearch.com/\r
+#              added Polymeta www.polymeta.hu (does not provide keywords)\r
+#              added scroogle http://www.scroogle.org/ (does not always provide keywords)\r
+#              added Tango http://tango.hu/search.php?st=0&q=jeles+napok\r
+#              Changed Google Cache notation 64\.233\.(161|167|179|183|187)\.104 to 64\.233\.1[0-9]{2}\.104\r
+#                                            72\.14\.(203|205|207|209|221)\.104 to 72\.14\.2[0-9]{2}\.104\r
+#                                            216\.239\.(51|59)\.104 to 216\.239\.5[0-9]\.104\r
+#                                            66\.102\.(7|9)\.104 to 66\.102\.[1-9]\.104\r
+# 2006-06-27 Sean Carlos http://www.antezeta.com/awstats.html\r
+#              added Onet.pl http://szukaj.onet.pl/\r
+#              corrected name "Wirtualna Polska" from "Szukaj" (search); added link http://szukaj.wp.pl/\r
+# 2006-06-30 Sean Carlos http://www.antezeta.com/awstats.html\r
+#      Additional Polish Search Engines:\r
+#      added Dodaj.pl http://www.dodaj.pl/\r
+#      added Gazeta.pl http://szukaj.gazeta.pl/\r
+#      added Gery.pl http://szukaj.gery.pl/\r
+#      added Hoga.pl http://www.hoga.pl/\r
+#      added Interia.pl http://www.google.interia.pl/\r
+#      added Katalog.Onet.pl http://katalog.onet.pl/\r
+#      added NetSprint.pl http://www.netsprint.pl/\r
+#      added o2.pl http://szukaj2.o2.pl/\r
+#      added Polska http://szukaj.polska.pl/\r
+#      added Szukacz http://www.szukacz.pl/\r
+#      added Wow.pl http://szukaj.wow.pl/\r
+#      added Sagool http://sagool.jp/\r
+\r
+# 2006-08-25 Social Bookmarks\r
+#      International\r
+#      added del.icio.us/search - for now, just search referrer. To do: consider /tag/(tagname) referrer?\r
+#      added stumbleupon.com - No keywords supplied.\r
+#      added swik.net\r
+#       added digg. Keywords sometimes supplied.\r
+#      Italy\r
+#      added segnalo.alice.it - No keywords supplied.\r
+#      added ineffabile.it - No keywords supplied.\r
+\r
+#       added filter for google groups.  Attempt to parse group name as keyword.\r
+\r
+# 2006-09-14\r
+#      added Eniro Sverige http://www.eniro.se/\r
+#      added MyWebSearch http://search.mywebsearch.com/\r
+#      added Teecno http://www.teecno.it/ Italian Open Source Search Engine\r
+\r
+#package AWSSE;\r
+\r
+# 2006-09-25 (Gabor Moizes)\r
+# added 4-counter (Google alternative) http://4-counter.com/\r
+# added Googlecom (Google alternative) http://googlecom.com/\r
+# added Goggle (Google alternative) http://goggle.co.hu/\r
+# added Comet toolbar http://as.starware.com\r
+# added new IP for Yahoo: 216.109.125.130\r
+# added Ledix http://ledix.net/\r
+# added AT&T search (powered by Google) http://www.att.net/\r
+# added Keresolap (Hungarian search engine) http://www.keresolap.hu/\r
+# added Mozbot (French search engine) http://www.mozbot.fr/\r
+# added Zoznam (Slovak search engine) http://www.zoznam.sk/\r
+# added sapo.pt (Portuguese search engine) http://www.sapo.pt/\r
+# added shaw.ca (powered by Google) http://start.shaw.ca/\r
+# added Searchalot http://www.searchalot.com/\r
+# added Copernic http://www.copernic.com/\r
+# added 216.109.125.130 to Yahoo\r
+# added 66.218.69.11 to Yahoo\r
+# added Avantfind http://www.avantfind.com/\r
+# added Steadysearch http://www.steadysearch.com/\r
+# added Steadysearch http://www.steady-search.com/\r
+# modified 216\.239\.5[0-9]\.104/search to 216\.239\.5[0-9]\.104\r
+\r
+# RobC 2016/09/02 $\r
+#  massive edit..... \r
+#  added all google country TLDs to split count by google country.\r
+#  any google TLD not listed in here goes into 'Google catchall' for each country\r
+#  each google country has 3 possibilities, normal, images, or catchall (a catchall for other google sub domains)\r
+#  Several other search engines added too.\r
+#  Whole file cleaned up and partly sorted, comments taken out to make it easier to \r
+#  add, find and edit entries. Fact is that vast majority of searches are from Google so\r
+#  I made it Google centric which shows you which countries your google searches are coming from.\r
+#  Should now contain all searchengines from awstats 7.5 release (plus a lot more)\r
+#  May be too slow for big log files but you can try and see.\r
+#  Currently tuned for my top search engines. Yours will likely differ.\r
+#  If you put your site's 30 most used search engines at top of SearchEnginesSearchIDOrder_list1 and\r
+#  at top of SearchEnginesHashID starting with most used at top, then performance is improved a tad.\r
+#  SearchEnginesSearchIDOrder_list1 and SearchEnginesHashID must be in exact same order as each other.\r
+#  SearchEnginesKnownUrl and SearchEnginesHashLib can be in any order you like.\r
+#  Good luck  \r
+#            \r
+#  p.s. save your current search_engines.pm file before using this one just in case it's too slow or you find an error.\r
+#       I'm bound to have made one or two mistakes but it runs a year's worth of log files from one of my sites just fine.  \r
+\r
+#------------------------------------------------------------------------------\r
+# SearchEnginesSearchIDOrder\r
+# It contains all matching criteria to search for in log fields. This list is\r
+# used to know in which order to search Search Engines IDs.\r
+# Most frequent ones are in list1, used when LevelForSearchEnginesDetection is 1 or more\r
+# Minor search engines are in list2, used when LevelForSearchEnginesDetection is 2 or more\r
+# Note: Regex IDs are in lower case and ' ' and '+' are changed into '_'\r
+#------------------------------------------------------------------------------\r
+@SearchEnginesSearchIDOrder_list1=(\r
+'^www\.google\.co\.uk$',\r
+'^images\.google\.co\.uk$',\r
+'google\.co\.uk$',\r
+'^www\.google\.com$',\r
+'^images\.google\.com$',\r
+'google\.com$',\r
+\r
+'bing\.com',\r
+'^(www\.|)yandex\.ru$',\r
+'^(www\.|)yandex\.com\.tr$',\r
+'^(www\.|)yandex\.ua$',\r
+'^(www\.|)yandex\.kz$',\r
+'^(www\.|)yandex\.com$',\r
+'yandex\.',\r
+'r\.search\.yahoo\.com',\r
+\r
+'^www\.google\.de$',\r
+'^images\.google\.de$',\r
+'google\.de$',\r
+'^www\.google\.fr$',\r
+'^images\.google\.fr$',\r
+'google\.fr$',\r
+'^www\.google\.ca$',\r
+'^images\.google\.ca$',\r
+'google\.ca$',\r
+'^www\.google\.es$',\r
+'^images\.google\.es$',\r
+'google\.es$',\r
+'^www\.google\.com\.au$',\r
+'^images\.google\.com\.au$',\r
+'google\.com\.au$',\r
+'^www\.google\.nl$',\r
+'^images\.google\.nl$',\r
+'google\.nl$',\r
+'^www\.google\.gr$',\r
+'^images\.google\.gr$',\r
+'google\.gr$',\r
+'^www\.google\.se$',\r
+'^images\.google\.se$',\r
+'google\.se$',\r
+'^www\.google\.ie$',\r
+'^images\.google\.ie$',\r
+'google\.ie$',\r
+'^www\.google\.it$',\r
+'^images\.google\.it$',\r
+'google\.it$',\r
+'^www\.google\.no$',\r
+'^images\.google\.no$',\r
+'google\.no$',\r
+'^www\.google\.com\.tr$',\r
+'^images\.google\.com\.tr$',\r
+'google\.com\.tr$',\r
+'^www\.google\.co\.in$',\r
+'^images\.google\.co\.in$',\r
+'google\.co\.in$',\r
+'^www\.google\.pt$',\r
+'^images\.google\.pt$',\r
+'google\.pt$',\r
+'^www\.google\.hr$',\r
+'^images\.google\.hr$',\r
+'google\.hr$',\r
+'^www\.google\.co\.nz$',\r
+'^images\.google\.co\.nz$',\r
+'google\.co\.nz$',\r
+'^www\.google\.pl$',\r
+'^images\.google\.pl$',\r
+'google\.pl$',\r
+'^www\.google\.ac$',\r
+'^images\.google\.ac$',\r
+'google\.ac$',\r
+'^www\.google\.ad$',\r
+'^images\.google\.ad$',\r
+'google\.ad$',\r
+'^www\.google\.ae$',\r
+'^images\.google\.ae$',\r
+'google\.ae$',\r
+'^www\.google\.al$',\r
+'^images\.google\.al$',\r
+'google\.al$',\r
+'^www\.google\.am$',\r
+'^images\.google\.am$',\r
+'google\.am$',\r
+'^www\.google\.as$',\r
+'^images\.google\.as$',\r
+'google\.as$',\r
+'^www\.google\.at$',\r
+'^images\.google\.at$',\r
+'google\.at$',\r
+'^www\.google\.az$',\r
+'^images\.google\.az$',\r
+'google\.az$',\r
+'^www\.google\.ba$',\r
+'^images\.google\.ba$',\r
+'google\.ba$',\r
+'^www\.google\.be$',\r
+'^images\.google\.be$',\r
+'google\.be$',\r
+'^www\.google\.bf$',\r
+'^images\.google\.bf$',\r
+'google\.bf$',\r
+'^www\.google\.bg$',\r
+'^images\.google\.bg$',\r
+'google\.bg$',\r
+'^www\.google\.bi$',\r
+'^images\.google\.bi$',\r
+'google\.bi$',\r
+'^www\.google\.bj$',\r
+'^images\.google\.bj$',\r
+'google\.bj$',\r
+'^www\.google\.bs$',\r
+'^images\.google\.bs$',\r
+'google\.bs$',\r
+'^www\.google\.bt$',\r
+'^images\.google\.bt$',\r
+'google\.bt$',\r
+'^www\.google\.by$',\r
+'^images\.google\.by$',\r
+'google\.by$',\r
+'^www\.google\.cat$',\r
+'^images\.google\.cat$',\r
+'google\.cat$',\r
+'^www\.google\.cc$',\r
+'^images\.google\.cc$',\r
+'google\.cc$',\r
+'^www\.google\.cd$',\r
+'^images\.google\.cd$',\r
+'google\.cd$',\r
+'^www\.google\.cf$',\r
+'^images\.google\.cf$',\r
+'google\.cf$',\r
+'^www\.google\.cg$',\r
+'^images\.google\.cg$',\r
+'google\.cg$',\r
+'^www\.google\.ch$',\r
+'^images\.google\.ch$',\r
+'google\.ch$',\r
+'^www\.google\.ci$',\r
+'^images\.google\.ci$',\r
+'google\.ci$',\r
+'^www\.google\.cl$',\r
+'^images\.google\.cl$',\r
+'google\.cl$',\r
+'^www\.google\.cm$',\r
+'^images\.google\.cm$',\r
+'google\.cm$',\r
+'^www\.google\.cn$',\r
+'^images\.google\.cn$',\r
+'google\.cn$',\r
+'^www\.google\.co\.ao$',\r
+'^images\.google\.co\.ao$',\r
+'google\.co\.ao$',\r
+'^www\.google\.co\.bw$',\r
+'^images\.google\.co\.bw$',\r
+'google\.co\.bw$',\r
+'^www\.google\.co\.ck$',\r
+'^images\.google\.co\.ck$',\r
+'google\.co\.ck$',\r
+'^www\.google\.co\.cr$',\r
+'^images\.google\.co\.cr$',\r
+'google\.co\.cr$',\r
+'^www\.google\.co\.id$',\r
+'^images\.google\.co\.id$',\r
+'google\.co\.id$',\r
+'^www\.google\.co\.il$',\r
+'^images\.google\.co\.il$',\r
+'google\.co\.il$',\r
+'^www\.google\.co\.jp$',\r
+'^images\.google\.co\.jp$',\r
+'google\.co\.jp$',\r
+'^www\.google\.co\.ke$',\r
+'^images\.google\.co\.ke$',\r
+'google\.co\.ke$',\r
+'^www\.google\.co\.kr$',\r
+'^images\.google\.co\.kr$',\r
+'google\.co\.kr$',\r
+'^www\.google\.co\.ls$',\r
+'^images\.google\.co\.ls$',\r
+'google\.co\.ls$',\r
+'^www\.google\.co\.ma$',\r
+'^images\.google\.co\.ma$',\r
+'google\.co\.ma$',\r
+'^www\.google\.co\.mz$',\r
+'^images\.google\.co\.mz$',\r
+'google\.co\.mz$',\r
+'^www\.google\.co\.th$',\r
+'^images\.google\.co\.th$',\r
+'google\.co\.th$',\r
+'^www\.google\.co\.tz$',\r
+'^images\.google\.co\.tz$',\r
+'google\.co\.tz$',\r
+'^www\.google\.co\.ug$',\r
+'^images\.google\.co\.ug$',\r
+'google\.co\.ug$',\r
+'^www\.google\.co\.uz$',\r
+'^images\.google\.co\.uz$',\r
+'google\.co\.uz$',\r
+'^www\.google\.co\.ve$',\r
+'^images\.google\.co\.ve$',\r
+'google\.co\.ve$',\r
+'^www\.google\.co\.vi$',\r
+'^images\.google\.co\.vi$',\r
+'google\.co\.vi$',\r
+'^www\.google\.co\.za$',\r
+'^images\.google\.co\.za$',\r
+'google\.co\.za$',\r
+'^www\.google\.co\.zm$',\r
+'^images\.google\.co\.zm$',\r
+'google\.co\.zm$',\r
+'^www\.google\.co\.zw$',\r
+'^images\.google\.co\.zw$',\r
+'google\.co\.zw$',\r
+'^www\.google\.com\.af$',\r
+'^images\.google\.com\.af$',\r
+'google\.com\.af$',\r
+'^www\.google\.com\.ag$',\r
+'^images\.google\.com\.ag$',\r
+'google\.com\.ag$',\r
+'^www\.google\.com\.ai$',\r
+'^images\.google\.com\.ai$',\r
+'google\.com\.ai$',\r
+'^www\.google\.com\.ar$',\r
+'^images\.google\.com\.ar$',\r
+'google\.com\.ar$',\r
+'^www\.google\.com\.bd$',\r
+'^images\.google\.com\.bd$',\r
+'google\.com\.bd$',\r
+'^www\.google\.com\.bh$',\r
+'^images\.google\.com\.bh$',\r
+'google\.com\.bh$',\r
+'^www\.google\.com\.bn$',\r
+'^images\.google\.com\.bn$',\r
+'google\.com\.bn$',\r
+'^www\.google\.com\.bo$',\r
+'^images\.google\.com\.bo$',\r
+'google\.com\.bo$',\r
+'^www\.google\.com\.br$',\r
+'^images\.google\.com\.br$',\r
+'google\.com\.br$',\r
+'^www\.google\.com\.bz$',\r
+'^images\.google\.com\.bz$',\r
+'google\.com\.bz$',\r
+'^www\.google\.com\.co$',\r
+'^images\.google\.com\.co$',\r
+'google\.com\.co$',\r
+'^www\.google\.com\.cu$',\r
+'^images\.google\.com\.cu$',\r
+'google\.com\.cu$',\r
+'^www\.google\.com\.cy$',\r
+'^images\.google\.com\.cy$',\r
+'google\.com\.cy$',\r
+'^www\.google\.com\.do$',\r
+'^images\.google\.com\.do$',\r
+'google\.com\.do$',\r
+'^www\.google\.com\.ec$',\r
+'^images\.google\.com\.ec$',\r
+'google\.com\.ec$',\r
+'^www\.google\.com\.eg$',\r
+'^images\.google\.com\.eg$',\r
+'google\.com\.eg$',\r
+'^www\.google\.com\.et$',\r
+'^images\.google\.com\.et$',\r
+'google\.com\.et$',\r
+'^www\.google\.com\.fj$',\r
+'^images\.google\.com\.fj$',\r
+'google\.com\.fj$',\r
+'^www\.google\.com\.gh$',\r
+'^images\.google\.com\.gh$',\r
+'google\.com\.gh$',\r
+'^www\.google\.com\.gi$',\r
+'^images\.google\.com\.gi$',\r
+'google\.com\.gi$',\r
+'^www\.google\.com\.gt$',\r
+'^images\.google\.com\.gt$',\r
+'google\.com\.gt$',\r
+'^www\.google\.com\.hk$',\r
+'^images\.google\.com\.hk$',\r
+'google\.com\.hk$',\r
+'^www\.google\.com\.jm$',\r
+'^images\.google\.com\.jm$',\r
+'google\.com\.jm$',\r
+'^www\.google\.com\.kh$',\r
+'^images\.google\.com\.kh$',\r
+'google\.com\.kh$',\r
+'^www\.google\.com\.kw$',\r
+'^images\.google\.com\.kw$',\r
+'google\.com\.kw$',\r
+'^www\.google\.com\.lb$',\r
+'^images\.google\.com\.lb$',\r
+'google\.com\.lb$',\r
+'^www\.google\.com\.lc$',\r
+'^images\.google\.com\.lc$',\r
+'google\.com\.lc$',\r
+'^www\.google\.com\.ly$',\r
+'^images\.google\.com\.ly$',\r
+'google\.com\.ly$',\r
+'^www\.google\.com\.mm$',\r
+'^images\.google\.com\.mm$',\r
+'google\.com\.mm$',\r
+'^www\.google\.com\.mt$',\r
+'^images\.google\.com\.mt$',\r
+'google\.com\.mt$',\r
+'^www\.google\.com\.mx$',\r
+'^images\.google\.com\.mx$',\r
+'google\.com\.mx$',\r
+'^www\.google\.com\.my$',\r
+'^images\.google\.com\.my$',\r
+'google\.com\.my$',\r
+'^www\.google\.com\.na$',\r
+'^images\.google\.com\.na$',\r
+'google\.com\.na$',\r
+'^www\.google\.com\.nf$',\r
+'^images\.google\.com\.nf$',\r
+'google\.com\.nf$',\r
+'^www\.google\.com\.ng$',\r
+'^images\.google\.com\.ng$',\r
+'google\.com\.ng$',\r
+'^www\.google\.com\.ni$',\r
+'^images\.google\.com\.ni$',\r
+'google\.com\.ni$',\r
+'^www\.google\.com\.np$',\r
+'^images\.google\.com\.np$',\r
+'google\.com\.np$',\r
+'^www\.google\.com\.om$',\r
+'^images\.google\.com\.om$',\r
+'google\.com\.om$',\r
+'^www\.google\.com\.pa$',\r
+'^images\.google\.com\.pa$',\r
+'google\.com\.pa$',\r
+'^www\.google\.com\.pe$',\r
+'^images\.google\.com\.pe$',\r
+'google\.com\.pe$',\r
+'^www\.google\.com\.pg$',\r
+'^images\.google\.com\.pg$',\r
+'google\.com\.pg$',\r
+'^www\.google\.com\.ph$',\r
+'^images\.google\.com\.ph$',\r
+'google\.com\.ph$',\r
+'^www\.google\.com\.pk$',\r
+'^images\.google\.com\.pk$',\r
+'google\.com\.pk$',\r
+'^www\.google\.com\.pr$',\r
+'^images\.google\.com\.pr$',\r
+'google\.com\.pr$',\r
+'^www\.google\.com\.py$',\r
+'^images\.google\.com\.py$',\r
+'google\.com\.py$',\r
+'^www\.google\.com\.qa$',\r
+'^images\.google\.com\.qa$',\r
+'google\.com\.qa$',\r
+'^www\.google\.com\.sa$',\r
+'^images\.google\.com\.sa$',\r
+'google\.com\.sa$',\r
+'^www\.google\.com\.sb$',\r
+'^images\.google\.com\.sb$',\r
+'google\.com\.sb$',\r
+'^www\.google\.com\.sg$',\r
+'^images\.google\.com\.sg$',\r
+'google\.com\.sg$',\r
+'^www\.google\.com\.sl$',\r
+'^images\.google\.com\.sl$',\r
+'google\.com\.sl$',\r
+'^www\.google\.com\.sv$',\r
+'^images\.google\.com\.sv$',\r
+'google\.com\.sv$',\r
+'^www\.google\.com\.tj$',\r
+'^images\.google\.com\.tj$',\r
+'google\.com\.tj$',\r
+'^www\.google\.com\.tw$',\r
+'^images\.google\.com\.tw$',\r
+'google\.com\.tw$',\r
+'^www\.google\.com\.ua$',\r
+'^images\.google\.com\.ua$',\r
+'google\.com\.ua$',\r
+'^www\.google\.com\.uy$',\r
+'^images\.google\.com\.uy$',\r
+'google\.com\.uy$',\r
+'^www\.google\.com\.vc$',\r
+'^images\.google\.com\.vc$',\r
+'google\.com\.vc$',\r
+'^www\.google\.com\.vn$',\r
+'^images\.google\.com\.vn$',\r
+'google\.com\.vn$',\r
+'^www\.google\.cv$',\r
+'^images\.google\.cv$',\r
+'google\.cv$',\r
+'^www\.google\.cz$',\r
+'^images\.google\.cz$',\r
+'google\.cz$',\r
+'^www\.google\.dj$',\r
+'^images\.google\.dj$',\r
+'google\.dj$',\r
+'^www\.google\.dk$',\r
+'^images\.google\.dk$',\r
+'google\.dk$',\r
+'^www\.google\.dm$',\r
+'^images\.google\.dm$',\r
+'google\.dm$',\r
+'^www\.google\.dz$',\r
+'^images\.google\.dz$',\r
+'google\.dz$',\r
+'^www\.google\.ee$',\r
+'^images\.google\.ee$',\r
+'google\.ee$',\r
+'^www\.google\.fi$',\r
+'^images\.google\.fi$',\r
+'google\.fi$',\r
+'^www\.google\.fm$',\r
+'^images\.google\.fm$',\r
+'google\.fm$',\r
+'^www\.google\.ga$',\r
+'^images\.google\.ga$',\r
+'google\.ga$',\r
+'^www\.google\.ge$',\r
+'^images\.google\.ge$',\r
+'google\.ge$',\r
+'^www\.google\.gf$',\r
+'^images\.google\.gf$',\r
+'google\.gf$',\r
+'^www\.google\.gg$',\r
+'^images\.google\.gg$',\r
+'google\.gg$',\r
+'^www\.google\.gl$',\r
+'^images\.google\.gl$',\r
+'google\.gl$',\r
+'^www\.google\.gm$',\r
+'^images\.google\.gm$',\r
+'google\.gm$',\r
+'^www\.google\.gp$',\r
+'^images\.google\.gp$',\r
+'google\.gp$',\r
+'^www\.google\.gy$',\r
+'^images\.google\.gy$',\r
+'google\.gy$',\r
+'^www\.google\.hn$',\r
+'^images\.google\.hn$',\r
+'google\.hn$',\r
+'^www\.google\.ht$',\r
+'^images\.google\.ht$',\r
+'google\.ht$',\r
+'^www\.google\.hu$',\r
+'^images\.google\.hu$',\r
+'google\.hu$',\r
+'^www\.google\.im$',\r
+'^images\.google\.im$',\r
+'google\.im$',\r
+'^www\.google\.io$',\r
+'^images\.google\.io$',\r
+'google\.io$',\r
+'^www\.google\.iq$',\r
+'^images\.google\.iq$',\r
+'google\.iq$',\r
+'^www\.google\.is$',\r
+'^images\.google\.is$',\r
+'google\.is$',\r
+'^www\.google\.je$',\r
+'^images\.google\.je$',\r
+'google\.je$',\r
+'^www\.google\.jo$',\r
+'^images\.google\.jo$',\r
+'google\.jo$',\r
+'^www\.google\.kg$',\r
+'^images\.google\.kg$',\r
+'google\.kg$',\r
+'^www\.google\.ki$',\r
+'^images\.google\.ki$',\r
+'google\.ki$',\r
+'^www\.google\.kz$',\r
+'^images\.google\.kz$',\r
+'google\.kz$',\r
+'^www\.google\.la$',\r
+'^images\.google\.la$',\r
+'google\.la$',\r
+'^www\.google\.li$',\r
+'^images\.google\.li$',\r
+'google\.li$',\r
+'^www\.google\.lk$',\r
+'^images\.google\.lk$',\r
+'google\.lk$',\r
+'^www\.google\.lt$',\r
+'^images\.google\.lt$',\r
+'google\.lt$',\r
+'^www\.google\.lu$',\r
+'^images\.google\.lu$',\r
+'google\.lu$',\r
+'^www\.google\.lv$',\r
+'^images\.google\.lv$',\r
+'google\.lv$',\r
+'^www\.google\.md$',\r
+'^images\.google\.md$',\r
+'google\.md$',\r
+'^www\.google\.me$',\r
+'^images\.google\.me$',\r
+'google\.me$',\r
+'^www\.google\.mg$',\r
+'^images\.google\.mg$',\r
+'google\.mg$',\r
+'^www\.google\.mk$',\r
+'^images\.google\.mk$',\r
+'google\.mk$',\r
+'^www\.google\.ml$',\r
+'^images\.google\.ml$',\r
+'google\.ml$',\r
+'^www\.google\.mn$',\r
+'^images\.google\.mn$',\r
+'google\.mn$',\r
+'^www\.google\.ms$',\r
+'^images\.google\.ms$',\r
+'google\.ms$',\r
+'^www\.google\.mu$',\r
+'^images\.google\.mu$',\r
+'google\.mu$',\r
+'^www\.google\.mv$',\r
+'^images\.google\.mv$',\r
+'google\.mv$',\r
+'^www\.google\.mw$',\r
+'^images\.google\.mw$',\r
+'google\.mw$',\r
+'^www\.google\.ne$',\r
+'^images\.google\.ne$',\r
+'google\.ne$',\r
+'^www\.google\.nr$',\r
+'^images\.google\.nr$',\r
+'google\.nr$',\r
+'^www\.google\.nu$',\r
+'^images\.google\.nu$',\r
+'google\.nu$',\r
+'^www\.google\.pn$',\r
+'^images\.google\.pn$',\r
+'google\.pn$',\r
+'^www\.google\.ps$',\r
+'^images\.google\.ps$',\r
+'google\.ps$',\r
+'^www\.google\.ro$',\r
+'^images\.google\.ro$',\r
+'google\.ro$',\r
+'^www\.google\.rs$',\r
+'^images\.google\.rs$',\r
+'google\.rs$',\r
+'^www\.google\.ru$',\r
+'^images\.google\.ru$',\r
+'google\.ru$',\r
+'^www\.google\.rw$',\r
+'^images\.google\.rw$',\r
+'google\.rw$',\r
+'^www\.google\.sc$',\r
+'^images\.google\.sc$',\r
+'google\.sc$',\r
+'^www\.google\.sh$',\r
+'^images\.google\.sh$',\r
+'google\.sh$',\r
+'^www\.google\.si$',\r
+'^images\.google\.si$',\r
+'google\.si$',\r
+'^www\.google\.sk$',\r
+'^images\.google\.sk$',\r
+'google\.sk$',\r
+'^www\.google\.sm$',\r
+'^images\.google\.sm$',\r
+'google\.sm$',\r
+'^www\.google\.sn$',\r
+'^images\.google\.sn$',\r
+'google\.sn$',\r
+'^www\.google\.so$',\r
+'^images\.google\.so$',\r
+'google\.so$',\r
+'^www\.google\.sr$',\r
+'^images\.google\.sr$',\r
+'google\.sr$',\r
+'^www\.google\.st$',\r
+'^images\.google\.st$',\r
+'google\.st$',\r
+'^www\.google\.td$',\r
+'^images\.google\.td$',\r
+'google\.td$',\r
+'^www\.google\.tg$',\r
+'^images\.google\.tg$',\r
+'google\.tg$',\r
+'^www\.google\.tk$',\r
+'^images\.google\.tk$',\r
+'google\.tk$',\r
+'^www\.google\.tl$',\r
+'^images\.google\.tl$',\r
+'google\.tl$',\r
+'^www\.google\.tm$',\r
+'^images\.google\.tm$',\r
+'google\.tm$',\r
+'^www\.google\.tn$',\r
+'^images\.google\.tn$',\r
+'google\.tn$',\r
+'^www\.google\.to$',\r
+'^images\.google\.to$',\r
+'google\.to$',\r
+'^www\.google\.tt$',\r
+'^images\.google\.tt$',\r
+'google\.tt$',\r
+'^www\.google\.us$',\r
+'^images\.google\.us$',\r
+'google\.us$',\r
+'^www\.google\.vg$',\r
+'^images\.google\.vg$',\r
+'google\.vg$',\r
+'^www\.google\.vu$',\r
+'^images\.google\.vu$',\r
+'google\.vu$',\r
+'^www\.google\.ws$',\r
+'^images\.google\.ws$',\r
+'google\.ws$',\r
+\r
+'au\.search\.yahoo\.com',\r
+'ca\.search\.yahoo\.com',\r
+'fr\.search\.yahoo\.com',\r
+'image\.search\.yahoo\.co\.jp',\r
+'images\.search\.yahoo\.com',\r
+'it\.search\.yahoo\.com',\r
+'ph\.search\.yahoo\.com',\r
+'se\.search\.yahoo\.com',\r
+'search\.yahoo\.co\.jp',\r
+'sg\.search\.yahoo\.com',\r
+'sg\.yhs4\.search\.yahoo\.com',\r
+'tw\.images\.search\.yahoo\.com',\r
+'uk\.search\.yahoo\.com',\r
+'uk\.yhs4\.search\.yahoo\.com',\r
+'us\.search\.yahoo\.com',\r
+'search\.yahoo\.com',\r
+'search\.yahoo',\r
+\r
+'babylon\.com',\r
+'search\.conduit\.com',\r
+'avg\.com',\r
+'mywebsearch\.com',\r
+'msn\.',\r
+'live\.com',\r
+'search\.aol\.co\.uk',\r
+'searcht\.aol\.co\.uk',\r
+'searcht\.aol\.com',\r
+'search\.aol\.com',\r
+'recherche\.aol\.fr',\r
+'suche\.aol\.de',\r
+'de\.aolsearch\.com',\r
+'sucheaol\.aol\.de',\r
+'search\.hp\.my\.aol\.co\.uk',\r
+'search\.aol\.pl',\r
+'o2suche\.aol\.de',\r
+'search\.aol\.',\r
+'^uk\.ask\.com$',\r
+'^de\.ask\.com$',\r
+'tb\.ask\.com$',\r
+'^images\.ask\.com$',\r
+\r
+'base\.google\.',\r
+'froogle\.google\.',\r
+'google\.[\w.]+/products',\r
+'googlecom\.com',\r
+'groups\.google\.',\r
+'googlee\.',\r
+\r
+'216\.239\.32\.20',\r
+'173\.194\.32\.223',\r
+'216\.239\.(35|37|39|51)\.100',\r
+'216\.239\.(35|37|39|51)\.101',\r
+'216\.239\.5[0-9]\.104',\r
+'64\.233\.1[0-9]{2}\.104',\r
+'66\.102\.[1-9]\.104',\r
+'66\.249\.93\.104',\r
+'72\.14\.2[0-9]{2}\.104',\r
+\r
+'maps\.google',\r
+'translate\.google',\r
+'173\.194\.35\.177',\r
+'google\.',\r
+\r
+'mail.yahoo.net',\r
+'(66\.218\.71\.225|216\.109\.117\.135|216\.109\.125\.130|66\.218\.69\.11)',\r
+'mindset\.research\.yahoo',\r
+'yahoo\.',\r
+\r
+'^www\.ask\.jp$',\r
+'^es\.ask\.com$',\r
+'^fr\.ask\.com$',\r
+'^www\.iask\.com$',\r
+'^it\.ask\.com$',\r
+'^nl\.ask\.com$',\r
+'(^|\.)ask\.com$',\r
+\r
+'www\.tesco\.net',\r
+'yell\.',\r
+'zapmeta\.ch',\r
+'zapmeta\.com',\r
+'zapmeta\.de',\r
+'zapmeta',\r
+\r
+'(^|\.)go\.com',\r
+'(161\.58\.227\.204|161\.58\.247\.101|212\.40\.165\.90|213\.133\.108\.202|217\.160\.108\.151|217\.160\.111\.99|217\.160\.131\.108|217\.160\.142\.227|217\.160\.176\.42)',\r
+'\.facemoods\.com',\r
+'\.funmoods\.com',\r
+'\.metasearch\.',\r
+'\.wow\.com',\r
+'163\.com',\r
+'1klik\.dk',\r
+'1search-board\.com',\r
+'212\.227\.33\.241',\r
+'3721\.com',\r
+'4\-counter\.com',\r
+'a9\.com',\r
+'accoona\.com',\r
+'alexa\.com',\r
+'allesklar\.de',\r
+'alltheweb\.com',\r
+'altavista\.',\r
+'amazon\.',\r
+'androidsearch\.com',\r
+'answerbus\.com',\r
+'anzwers\.com\.au',\r
+'aport\.ru',\r
+'arianna\.libero\.it',\r
+'as\.starware\.com',\r
+'asevenboard\.com',\r
+'atlanticbb\.net',\r
+'atlas\.cz',\r
+'atomz\.',\r
+'att\.net',\r
+'auone\.jp',\r
+'avantfind\.com',\r
+'baidu\.com',\r
+'bbc\.co\.uk/cgi-bin/search',\r
+'biglotron\.com',\r
+'blekko\.com',\r
+'blingo\.com',\r
+'bungeebonesdotcom',\r
+'centraldatabase\.org',\r
+'centrum\.cz',\r
+'centurylink\.net',\r
+'charter\.net',\r
+'chatzum\.com',\r
+'checkparams\.com',\r
+'chello\.at',\r
+'chello\.be',\r
+'chello\.cz',\r
+'chello\.fr',\r
+'chello\.hu',\r
+'chello\.nl',\r
+'chello\.no',\r
+'chello\.pl',\r
+'chello\.se',\r
+'chello\.sk',\r
+'chello',\r
+'claro-search\.com',\r
+'clinck\.in',\r
+'clusty\.com',\r
+'copernic\.com',\r
+'crawler\.com',\r
+'ctrouve\.',\r
+'dalesearch\.com',\r
+'danielsen\.com',\r
+'daum\.net',\r
+'de\.dolphin\.com',\r
+'de\.wiki\.gov\.cn',\r
+'de\.wow\.com',\r
+'dejanews\.',\r
+'del\.icio\.us',\r
+'delta-search',\r
+'digg\.com',\r
+'dmoz\.org',\r
+'dodaj\.pl',\r
+'dogpile\.com',\r
+'duckduckgo',\r
+'easysearch\.org\.uk',\r
+'ecosia\.org',\r
+'edderkoppen\.dk',\r
+'engine\.exe',\r
+'eniro\.no',\r
+'eniro\.se',\r
+'ereadingsource\.com',\r
+'es\.mirago\.com',\r
+'etools\.ch',\r
+'euroseek\.',\r
+'everyclick\.com',\r
+'evreka\.passagen\.se',\r
+'excite\.',\r
+'extern\.peoplecheck\.de',\r
+'fastbot\.de',\r
+'find\.dk',\r
+'find1friend\.com',\r
+'findamo\.com',\r
+'findarticles\.com',\r
+'fireball\.de',\r
+'forums\.iboats\.com',\r
+'foxstart\.com',\r
+'francite\.',\r
+'gazeta\.pl',\r
+'gery\.pl',\r
+'globososo\.',\r
+'go\.mail\.ru',\r
+'go\.speedbit\.com',\r
+'go2net\.com',\r
+'godado',\r
+'goggle\.co\.hu$',\r
+'goliat\.hu',\r
+'goodsearch\.com',\r
+'gotuneed\.com',\r
+'haku\.www\.fi',\r
+'heureka\.hu',\r
+'hoga\.pl',\r
+'hotbot\.',\r
+'hubwe\.net',\r
+'icerocket\.com',\r
+'icq\.com\/search',\r
+'ifind\.freeserve',\r
+'ilse\.',\r
+'inbox\.com',\r
+'index\.hu',\r
+'ineffabile\.it',\r
+'info\.co\.uk',\r
+'infoseek\.de',\r
+'infospace\.com',\r
+'inspsearch\.com',\r
+'int\.search\.myway\.com',\r
+'int\.search-results\.com',\r
+'interia\.pl',\r
+'isearch\.nation\.com',\r
+'i-une\.com',\r
+'ixquick\.com',\r
+'izito\.co\.uk',\r
+'izito\.co\.de',\r
+'izito\.',\r
+'jubii\.dk',\r
+'jumpy\.it',\r
+'juno\.com',\r
+'jyxo\.(cz|com)',\r
+'kartoo\.com',\r
+'katalog\.onet\.pl',\r
+'kataweb\.it',\r
+'kereso\.startlap\.hu',\r
+'keresolap\.hu',\r
+'kvasir\.',\r
+'kvitters\.',\r
+'lapkereso\.hu',\r
+'lbb\.org',\r
+'ledix\.net',\r
+'libero\.it/',\r
+'localmoxie\.com',\r
+'looksmart\.co\.uk',\r
+'looksmart\.',\r
+'lycos\.',\r
+'mamma\.',\r
+'meinestadt\.de',\r
+'meta\.ua',\r
+'metabot\.ru',\r
+'metacrawler\.',\r
+'metager\.de',\r
+'miner\.bol\.com\.br',\r
+'mirago\.be',\r
+'mirago\.ch',\r
+'mirago\.co\.uk',\r
+'mirago\.de',\r
+'mirago\.dk',\r
+'mirago\.fr',\r
+'mirago\.it',\r
+'mirago\.nl',\r
+'mirago\.se',\r
+'mirago',\r
+'mitrasites\.com',\r
+'mozbot\.fr',\r
+'my\.allgameshome\.com',\r
+'mys\.yoursearch\.me',\r
+'mysearch\.',\r
+'mysearchdial\.com',\r
+'mysearchresults\.com',\r
+'myway\.com',\r
+'najdi\.to',\r
+'nation\.',\r
+'navigationshilfe\.t-online\.de',\r
+'nbci\.com\/search',\r
+'netluchs\.de',\r
+'netscape\.',\r
+'netsprint\.pl',\r
+'netstjernen\.dk',\r
+'netzero\.net',\r
+'no\.mirago\.com',\r
+'northernlight\.',\r
+'nusearch\.com',\r
+'o2\.pl',\r
+'ofir\.dk',\r
+'opasia\.dk',\r
+'orangeworld\.co\.uk',\r
+'orbis\.dk',\r
+'overture\.com',\r
+'pch\.com',\r
+'picsearch\.de',\r
+'pictures\.com',\r
+'plusnetwork\.com',\r
+'pogodak\.',\r
+'polska\.pl',\r
+'polymeta\.hu',\r
+'preciobarato\.xyz',\r
+'questionanswering\.com',\r
+'quick\.cz',\r
+'rambler\.ru',\r
+'recherche\.club-internet\.fr',\r
+'rechercher\.libertysurf\.fr',\r
+'redbox\.cz',\r
+'rr\.com',\r
+'sagool\.jp',\r
+'sapo\.pt',\r
+'schoenerbrausen\.de',\r
+'scroogle\.org',\r
+'search[\w\-]+\.free\.fr',\r
+'search\.1und1\.de',\r
+'search\.alice\.it\.master',\r
+'search\.alice\.it',\r
+'search\.alot\.com',\r
+'search\.bluewin\.ch',\r
+'search\.bt\.com',\r
+'search\.certified-toolbar\.com',\r
+'search\.ch',\r
+'search\.comcast\.net',\r
+'search\.earthlink\.net',\r
+'search\.fbdownloader\.com',\r
+'search\.fdownloadr\.com',\r
+'search\.foxtab\.com',\r
+'search\.genieo\.com',\r
+'search\.goo\.ne\.jp',\r
+'search\.handycafe\.com',\r
+'search\.incredibar\.com',\r
+'search\.incredimail\.com',\r
+'search\.internetto\.hu',\r
+'search\.orange\.co\.uk',\r
+'search\.sky\.com',\r
+'search\.sli\.sympatico\.ca',\r
+'search\.socialdownloadr\.com',\r
+'search\.sweetim\.com',\r
+'search\.terra\.',\r
+'search\.zonealarm\.com',\r
+'searchalgo\.com',\r
+'searchalot\.com',\r
+'searchcompletion\.com',\r
+'searches\.qone8\.com',\r
+'searches\.safehomepage\.com',\r
+'searches\.vi-view\.com',\r
+'searchesnavigator\.com',\r
+'searchgol\.com',\r
+'searchlistingsite\.com',\r
+'searchmobileonline\.com',\r
+'search-results\.com',\r
+'search-results\.mobi',\r
+'searchsafer\.com',\r
+'searchy\.co\.uk',\r
+'searchya\.com',\r
+'segnalo\.alice\.it',\r
+'semalt\.com',\r
+'sensis\.com\.au',\r
+'seznam\.cz',\r
+'shinyseek\.it',\r
+'shoppstop\.com',\r
+'sify\.com',\r
+'sm\.de',\r
+'smartsuggestor\.com',\r
+'snapdo\.com',\r
+'softonic\.com',\r
+'sogou\.com',\r
+'sok\.start\.no',\r
+'sol\.dk',\r
+'soso\.com',\r
+'sphere\.com',\r
+'splut\.',\r
+'spotjockey\.',\r
+'spray\.',\r
+'sr\.searchfunmoods\.com',\r
+'start\.iminent\.com',\r
+'start\.shaw\.ca',\r
+'start\.toshiba\.com',\r
+'startpage\.com',\r
+'startsiden\.no',\r
+'static\.flipora\.com',\r
+'steadysearch\.com',\r
+'steady-search\.com',\r
+'stumbleupon\.com',\r
+'suche\.1und1\.de',\r
+'suche\.freenet\.de',\r
+'suche\.gmx\.at',\r
+'suche\.gmx\.net',\r
+'suche\d?\.web\.de',\r
+'suchen\.abacho\.de',\r
+'sumaja\.de',\r
+'supereva\.com',\r
+'surfcanyon\.com',\r
+'sweetpacks-search\.com',\r
+'swik\.net',\r
+'swisscows\.ch',\r
+'szukacz\.pl',\r
+'szukaj\.onet\.pl',\r
+'szukaj\.wp\.pl',\r
+'talktalk\.co\.uk',\r
+'tango\.hu',\r
+'teecno\.it',\r
+'teoma\.',\r
+'theallsearches\.com',\r
+'three\.co\.uk',\r
+'tiscali\.',\r
+'tixuma\.de',\r
+'toile\.com',\r
+'t-online\.de',\r
+'t-online',\r
+'turtle\.ru',\r
+'tyfon\.dk',\r
+'uk\.foxstart\.com',\r
+'ukdirectory\.',\r
+'ukindex\.co\.uk',\r
+'ukplus\.',\r
+'umfis\.de',\r
+'umuwa\.de',\r
+'uni-hannover\.de',\r
+'vindex\.',\r
+'virgilio\.it',\r
+'virginmedia\.com',\r
+'vivisimo\.com',\r
+'vizsla\.origo\.hu',\r
+'vnet\.cn',\r
+'voila\.',\r
+'wahoo\.hu',\r
+'webalta\.ru',\r
+'webcrawler\.',\r
+'webmania\.hu',\r
+'websearch\.rakuten\.co\.jp',\r
+'whorush\.com',\r
+'windowssearch\.com',\r
+'wisenut\.com',\r
+'wow\.pl',\r
+'wow\.utop\.it',\r
+'www\.benefind\.de',\r
+'www\.buenosearch\.com',\r
+'www\.dregol\.com',\r
+'www\.govome\.com',\r
+'www\.holasearch\.com',\r
+'www\.metasuche\.ch',\r
+'www\.oneseek\.de',\r
+'www\.qwant\.com',\r
+'www\.search\.com',\r
+'www\.startxxl\.com',\r
+'www\.vlips\.de',\r
+'www\.wow\.com',\r
+'www1\.search-results\.com',\r
+'wwweasel\.de',\r
+'yourbestsearch\.net',\r
+'youtube\.com',\r
+'zhongsou\.com',\r
+'zoeken\.nl',\r
+'zoznam\.sk'\r
+);\r
+\r
+# Minor search engines: this list is currently empty.\r
+@SearchEnginesSearchIDOrder_list2 = ();\r
+# Generic search engines: one pattern text, 'search.' followed by any\r
+# characters, then a literal dot and one or more word characters.\r
+@SearchEnginesSearchIDOrder_listgen = ( 'search\..*\.\w+' );\r
+\r
+# NotSearchEnginesKeys\r
+# If a search engine key is found, we check its exclude list to know if it's\r
+# really a search engine\r
+#------------------------------------------------------------------------------\r
+# Maps a search engine key to the pattern text of hosts that contain that key\r
+# but must be excluded.\r
+# NOTE(review): values are presumably applied as regular expressions by the\r
+# caller; confirm before relying on the alternation used below.\r
+%NotSearchEnginesKeys=(\r
+'altavista\.'=>'babelfish\.altavista\.',\r
+# A hash keeps only one value per key, so every exclusion for 'google\.' has\r
+# to live in a single entry. Listing the key twice silently dropped the mail\r
+# exclusion and kept only the translate one.\r
+'google\.'=>'(?:mail|translate)\.google\.',\r
+'msn\.'=>'hotmail\.msn\.',\r
+'tiscali\.'=>'mail\.tiscali\.',\r
+'yahoo\.'=>'mail\.yahoo\.',\r
+'yandex\.'=>'direct\.yandex\.'\r
+);\r
+\r
+# SearchEnginesHashID\r
+# Each Search Engine Search ID is associated to an AWStats id string\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesHashID = (\r
+# Major search engines\r
+\r
+'^www\.google\.co\.uk$','www_google_co_uk',\r
+'^images\.google\.co\.uk$','images_google_co_uk',\r
+'google\.co\.uk$','google_co_uk',\r
+'^www\.google\.com$','www_google_com',\r
+'^images\.google\.com$','images_google_com',\r
+'google\.com$','google_com',\r
+\r
+'bing\.com','bing',\r
+'^(www\.|)yandex\.ru$','yandexru',\r
+'^(www\.|)yandex\.com\.tr$','yandexcomtr',\r
+'^(www\.|)yandex\.ua$','yandexua',\r
+'^(www\.|)yandex\.kz$','yandexkz',\r
+'^(www\.|)yandex\.com$','yandexcom',\r
+'yandex\.','yandex',\r
+'r\.search\.yahoo\.com','r_search_yahoo_com',\r
+\r
+'^www\.google\.de$','www_google_de',\r
+'^images\.google\.de$','images_google_de',\r
+'google\.de$','google_de',\r
+'^www\.google\.fr$','www_google_fr',\r
+'^images\.google\.fr$','images_google_fr',\r
+'google\.fr$','google_fr',\r
+'^www\.google\.ca$','www_google_ca',\r
+'^images\.google\.ca$','images_google_ca',\r
+'google\.ca$','google_ca',\r
+'^www\.google\.es$','www_google_es',\r
+'^images\.google\.es$','images_google_es',\r
+'google\.es$','google_es',\r
+'^www\.google\.com\.au$','www_google_com_au',\r
+'^images\.google\.com\.au$','images_google_com_au',\r
+'google\.com\.au$','google_com_au',\r
+'^www\.google\.nl$','www_google_nl',\r
+'^images\.google\.nl$','images_google_nl',\r
+'google\.nl$','google_nl',\r
+'^www\.google\.gr$','www_google_gr',\r
+'^images\.google\.gr$','images_google_gr',\r
+'google\.gr$','google_gr',\r
+'^www\.google\.se$','www_google_se',\r
+'^images\.google\.se$','images_google_se',\r
+'google\.se$','google_se',\r
+'^www\.google\.ie$','www_google_ie',\r
+'^images\.google\.ie$','images_google_ie',\r
+'google\.ie$','google_ie',\r
+'^www\.google\.it$','www_google_it',\r
+'^images\.google\.it$','images_google_it',\r
+'google\.it$','google_it',\r
+'^www\.google\.no$','www_google_no',\r
+'^images\.google\.no$','images_google_no',\r
+'google\.no$','google_no',\r
+'^www\.google\.com\.tr$','www_google_com_tr',\r
+'^images\.google\.com\.tr$','images_google_com_tr',\r
+'google\.com\.tr$','google_com_tr',\r
+'^www\.google\.co\.in$','www_google_co_in',\r
+'^images\.google\.co\.in$','images_google_co_in',\r
+'google\.co\.in$','google_co_in',\r
+'^www\.google\.pt$','www_google_pt',\r
+'^images\.google\.pt$','images_google_pt',\r
+'google\.pt$','google_pt',\r
+'^www\.google\.hr$','www_google_hr',\r
+'^images\.google\.hr$','images_google_hr',\r
+'google\.hr$','google_hr',\r
+'^www\.google\.co\.nz$','www_google_co_nz',\r
+'^images\.google\.co\.nz$','images_google_co_nz',\r
+'google\.co\.nz$','google_co_nz',\r
+'^www\.google\.pl$','www_google_pl',\r
+'^images\.google\.pl$','images_google_pl',\r
+'google\.pl$','google_pl',\r
+'^www\.google\.ac$','www_google_ac',\r
+'^images\.google\.ac$','images_google_ac',\r
+'google\.ac$','google_ac',\r
+'^www\.google\.ad$','www_google_ad',\r
+'^images\.google\.ad$','images_google_ad',\r
+'google\.ad$','google_ad',\r
+'^www\.google\.ae$','www_google_ae',\r
+'^images\.google\.ae$','images_google_ae',\r
+'google\.ae$','google_ae',\r
+'^www\.google\.al$','www_google_al',\r
+'^images\.google\.al$','images_google_al',\r
+'google\.al$','google_al',\r
+'^www\.google\.am$','www_google_am',\r
+'^images\.google\.am$','images_google_am',\r
+'google\.am$','google_am',\r
+'^www\.google\.as$','www_google_as',\r
+'^images\.google\.as$','images_google_as',\r
+'google\.as$','google_as',\r
+'^www\.google\.at$','www_google_at',\r
+'^images\.google\.at$','images_google_at',\r
+'google\.at$','google_at',\r
+'^www\.google\.az$','www_google_az',\r
+'^images\.google\.az$','images_google_az',\r
+'google\.az$','google_az',\r
+'^www\.google\.ba$','www_google_ba',\r
+'^images\.google\.ba$','images_google_ba',\r
+'google\.ba$','google_ba',\r
+'^www\.google\.be$','www_google_be',\r
+'^images\.google\.be$','images_google_be',\r
+'google\.be$','google_be',\r
+'^www\.google\.bf$','www_google_bf',\r
+'^images\.google\.bf$','images_google_bf',\r
+'google\.bf$','google_bf',\r
+'^www\.google\.bg$','www_google_bg',\r
+'^images\.google\.bg$','images_google_bg',\r
+'google\.bg$','google_bg',\r
+'^www\.google\.bi$','www_google_bi',\r
+'^images\.google\.bi$','images_google_bi',\r
+'google\.bi$','google_bi',\r
+'^www\.google\.bj$','www_google_bj',\r
+'^images\.google\.bj$','images_google_bj',\r
+'google\.bj$','google_bj',\r
+'^www\.google\.bs$','www_google_bs',\r
+'^images\.google\.bs$','images_google_bs',\r
+'google\.bs$','google_bs',\r
+'^www\.google\.bt$','www_google_bt',\r
+'^images\.google\.bt$','images_google_bt',\r
+'google\.bt$','google_bt',\r
+'^www\.google\.by$','www_google_by',\r
+'^images\.google\.by$','images_google_by',\r
+'google\.by$','google_by',\r
+'^www\.google\.cat$','www_google_cat',\r
+'^images\.google\.cat$','images_google_cat',\r
+'google\.cat$','google_cat',\r
+'^www\.google\.cc$','www_google_cc',\r
+'^images\.google\.cc$','images_google_cc',\r
+'google\.cc$','google_cc',\r
+'^www\.google\.cd$','www_google_cd',\r
+'^images\.google\.cd$','images_google_cd',\r
+'google\.cd$','google_cd',\r
+'^www\.google\.cf$','www_google_cf',\r
+'^images\.google\.cf$','images_google_cf',\r
+'google\.cf$','google_cf',\r
+'^www\.google\.cg$','www_google_cg',\r
+'^images\.google\.cg$','images_google_cg',\r
+'google\.cg$','google_cg',\r
+'^www\.google\.ch$','www_google_ch',\r
+'^images\.google\.ch$','images_google_ch',\r
+'google\.ch$','google_ch',\r
+'^www\.google\.ci$','www_google_ci',\r
+'^images\.google\.ci$','images_google_ci',\r
+'google\.ci$','google_ci',\r
+'^www\.google\.cl$','www_google_cl',\r
+'^images\.google\.cl$','images_google_cl',\r
+'google\.cl$','google_cl',\r
+'^www\.google\.cm$','www_google_cm',\r
+'^images\.google\.cm$','images_google_cm',\r
+'google\.cm$','google_cm',\r
+'^www\.google\.cn$','www_google_cn',\r
+'^images\.google\.cn$','images_google_cn',\r
+'google\.cn$','google_cn',\r
+'^www\.google\.co\.ao$','www_google_co_ao',\r
+'^images\.google\.co\.ao$','images_google_co_ao',\r
+'google\.co\.ao$','google_co_ao',\r
+'^www\.google\.co\.bw$','www_google_co_bw',\r
+'^images\.google\.co\.bw$','images_google_co_bw',\r
+'google\.co\.bw$','google_co_bw',\r
+'^www\.google\.co\.ck$','www_google_co_ck',\r
+'^images\.google\.co\.ck$','images_google_co_ck',\r
+'google\.co\.ck$','google_co_ck',\r
+'^www\.google\.co\.cr$','www_google_co_cr',\r
+'^images\.google\.co\.cr$','images_google_co_cr',\r
+'google\.co\.cr$','google_co_cr',\r
+'^www\.google\.co\.id$','www_google_co_id',\r
+'^images\.google\.co\.id$','images_google_co_id',\r
+'google\.co\.id$','google_co_id',\r
+'^www\.google\.co\.il$','www_google_co_il',\r
+'^images\.google\.co\.il$','images_google_co_il',\r
+'google\.co\.il$','google_co_il',\r
+'^www\.google\.co\.jp$','www_google_co_jp',\r
+'^images\.google\.co\.jp$','images_google_co_jp',\r
+'google\.co\.jp$','google_co_jp',\r
+'^www\.google\.co\.ke$','www_google_co_ke',\r
+'^images\.google\.co\.ke$','images_google_co_ke',\r
+'google\.co\.ke$','google_co_ke',\r
+'^www\.google\.co\.kr$','www_google_co_kr',\r
+'^images\.google\.co\.kr$','images_google_co_kr',\r
+'google\.co\.kr$','google_co_kr',\r
+'^www\.google\.co\.ls$','www_google_co_ls',\r
+'^images\.google\.co\.ls$','images_google_co_ls',\r
+'google\.co\.ls$','google_co_ls',\r
+'^www\.google\.co\.ma$','www_google_co_ma',\r
+'^images\.google\.co\.ma$','images_google_co_ma',\r
+'google\.co\.ma$','google_co_ma',\r
+'^www\.google\.co\.mz$','www_google_co_mz',\r
+'^images\.google\.co\.mz$','images_google_co_mz',\r
+'google\.co\.mz$','google_co_mz',\r
+'^www\.google\.co\.th$','www_google_co_th',\r
+'^images\.google\.co\.th$','images_google_co_th',\r
+'google\.co\.th$','google_co_th',\r
+'^www\.google\.co\.tz$','www_google_co_tz',\r
+'^images\.google\.co\.tz$','images_google_co_tz',\r
+'google\.co\.tz$','google_co_tz',\r
+'^www\.google\.co\.ug$','www_google_co_ug',\r
+'^images\.google\.co\.ug$','images_google_co_ug',\r
+'google\.co\.ug$','google_co_ug',\r
+'^www\.google\.co\.uz$','www_google_co_uz',\r
+'^images\.google\.co\.uz$','images_google_co_uz',\r
+'google\.co\.uz$','google_co_uz',\r
+'^www\.google\.co\.ve$','www_google_co_ve',\r
+'^images\.google\.co\.ve$','images_google_co_ve',\r
+'google\.co\.ve$','google_co_ve',\r
+'^www\.google\.co\.vi$','www_google_co_vi',\r
+'^images\.google\.co\.vi$','images_google_co_vi',\r
+'google\.co\.vi$','google_co_vi',\r
+'^www\.google\.co\.za$','www_google_co_za',\r
+'^images\.google\.co\.za$','images_google_co_za',\r
+'google\.co\.za$','google_co_za',\r
+'^www\.google\.co\.zm$','www_google_co_zm',\r
+'^images\.google\.co\.zm$','images_google_co_zm',\r
+'google\.co\.zm$','google_co_zm',\r
+'^www\.google\.co\.zw$','www_google_co_zw',\r
+'^images\.google\.co\.zw$','images_google_co_zw',\r
+'google\.co\.zw$','google_co_zw',\r
+'^www\.google\.com\.af$','www_google_com_af',\r
+'^images\.google\.com\.af$','images_google_com_af',\r
+'google\.com\.af$','google_com_af',\r
+'^www\.google\.com\.ag$','www_google_com_ag',\r
+'^images\.google\.com\.ag$','images_google_com_ag',\r
+'google\.com\.ag$','google_com_ag',\r
+'^www\.google\.com\.ai$','www_google_com_ai',\r
+'^images\.google\.com\.ai$','images_google_com_ai',\r
+'google\.com\.ai$','google_com_ai',\r
+'^www\.google\.com\.ar$','www_google_com_ar',\r
+'^images\.google\.com\.ar$','images_google_com_ar',\r
+'google\.com\.ar$','google_com_ar',\r
+'^www\.google\.com\.bd$','www_google_com_bd',\r
+'^images\.google\.com\.bd$','images_google_com_bd',\r
+'google\.com\.bd$','google_com_bd',\r
+'^www\.google\.com\.bh$','www_google_com_bh',\r
+'^images\.google\.com\.bh$','images_google_com_bh',\r
+'google\.com\.bh$','google_com_bh',\r
+'^www\.google\.com\.bn$','www_google_com_bn',\r
+'^images\.google\.com\.bn$','images_google_com_bn',\r
+'google\.com\.bn$','google_com_bn',\r
+'^www\.google\.com\.bo$','www_google_com_bo',\r
+'^images\.google\.com\.bo$','images_google_com_bo',\r
+'google\.com\.bo$','google_com_bo',\r
+'^www\.google\.com\.br$','www_google_com_br',\r
+'^images\.google\.com\.br$','images_google_com_br',\r
+'google\.com\.br$','google_com_br',\r
+'^www\.google\.com\.bz$','www_google_com_bz',\r
+'^images\.google\.com\.bz$','images_google_com_bz',\r
+'google\.com\.bz$','google_com_bz',\r
+'^www\.google\.com\.co$','www_google_com_co',\r
+'^images\.google\.com\.co$','images_google_com_co',\r
+'google\.com\.co$','google_com_co',\r
+'^www\.google\.com\.cu$','www_google_com_cu',\r
+'^images\.google\.com\.cu$','images_google_com_cu',\r
+'google\.com\.cu$','google_com_cu',\r
+\r
+'^www\.google\.com\.cy$','www_google_com_cy',\r
+'^images\.google\.com\.cy$','images_google_com_cy',\r
+'google\.com\.cy$','google_com_cy',\r
+'^www\.google\.com\.do$','www_google_com_do',\r
+'^images\.google\.com\.do$','images_google_com_do',\r
+'google\.com\.do$','google_com_do',\r
+'^www\.google\.com\.ec$','www_google_com_ec',\r
+'^images\.google\.com\.ec$','images_google_com_ec',\r
+'google\.com\.ec$','google_com_ec',\r
+'^www\.google\.com\.eg$','www_google_com_eg',\r
+'^images\.google\.com\.eg$','images_google_com_eg',\r
+'google\.com\.eg$','google_com_eg',\r
+'^www\.google\.com\.et$','www_google_com_et',\r
+'^images\.google\.com\.et$','images_google_com_et',\r
+'google\.com\.et$','google_com_et',\r
+'^www\.google\.com\.fj$','www_google_com_fj',\r
+'^images\.google\.com\.fj$','images_google_com_fj',\r
+'google\.com\.fj$','google_com_fj',\r
+'^www\.google\.com\.gh$','www_google_com_gh',\r
+'^images\.google\.com\.gh$','images_google_com_gh',\r
+'google\.com\.gh$','google_com_gh',\r
+'^www\.google\.com\.gi$','www_google_com_gi',\r
+'^images\.google\.com\.gi$','images_google_com_gi',\r
+'google\.com\.gi$','google_com_gi',\r
+'^www\.google\.com\.gt$','www_google_com_gt',\r
+'^images\.google\.com\.gt$','images_google_com_gt',\r
+'google\.com\.gt$','google_com_gt',\r
+'^www\.google\.com\.hk$','www_google_com_hk',\r
+'^images\.google\.com\.hk$','images_google_com_hk',\r
+'google\.com\.hk$','google_com_hk',\r
+'^www\.google\.com\.jm$','www_google_com_jm',\r
+'^images\.google\.com\.jm$','images_google_com_jm',\r
+'google\.com\.jm$','google_com_jm',\r
+'^www\.google\.com\.kh$','www_google_com_kh',\r
+'^images\.google\.com\.kh$','images_google_com_kh',\r
+'google\.com\.kh$','google_com_kh',\r
+'^www\.google\.com\.kw$','www_google_com_kw',\r
+'^images\.google\.com\.kw$','images_google_com_kw',\r
+'google\.com\.kw$','google_com_kw',\r
+'^www\.google\.com\.lb$','www_google_com_lb',\r
+'^images\.google\.com\.lb$','images_google_com_lb',\r
+'google\.com\.lb$','google_com_lb',\r
+'^www\.google\.com\.lc$','www_google_com_lc',\r
+'^images\.google\.com\.lc$','images_google_com_lc',\r
+'google\.com\.lc$','google_com_lc',\r
+'^www\.google\.com\.ly$','www_google_com_ly',\r
+'^images\.google\.com\.ly$','images_google_com_ly',\r
+'google\.com\.ly$','google_com_ly',\r
+'^www\.google\.com\.mm$','www_google_com_mm',\r
+'^images\.google\.com\.mm$','images_google_com_mm',\r
+'google\.com\.mm$','google_com_mm',\r
+'^www\.google\.com\.mt$','www_google_com_mt',\r
+'^images\.google\.com\.mt$','images_google_com_mt',\r
+'google\.com\.mt$','google_com_mt',\r
+'^www\.google\.com\.mx$','www_google_com_mx',\r
+'^images\.google\.com\.mx$','images_google_com_mx',\r
+'google\.com\.mx$','google_com_mx',\r
+'^www\.google\.com\.my$','www_google_com_my',\r
+'^images\.google\.com\.my$','images_google_com_my',\r
+'google\.com\.my$','google_com_my',\r
+'^www\.google\.com\.na$','www_google_com_na',\r
+'^images\.google\.com\.na$','images_google_com_na',\r
+'google\.com\.na$','google_com_na',\r
+'^www\.google\.com\.nf$','www_google_com_nf',\r
+'^images\.google\.com\.nf$','images_google_com_nf',\r
+'google\.com\.nf$','google_com_nf',\r
+'^www\.google\.com\.ng$','www_google_com_ng',\r
+'^images\.google\.com\.ng$','images_google_com_ng',\r
+'google\.com\.ng$','google_com_ng',\r
+'^www\.google\.com\.ni$','www_google_com_ni',\r
+'^images\.google\.com\.ni$','images_google_com_ni',\r
+'google\.com\.ni$','google_com_ni',\r
+'^www\.google\.com\.np$','www_google_com_np',\r
+'^images\.google\.com\.np$','images_google_com_np',\r
+'google\.com\.np$','google_com_np',\r
+'^www\.google\.com\.om$','www_google_com_om',\r
+'^images\.google\.com\.om$','images_google_com_om',\r
+'google\.com\.om$','google_com_om',\r
+'^www\.google\.com\.pa$','www_google_com_pa',\r
+'^images\.google\.com\.pa$','images_google_com_pa',\r
+'google\.com\.pa$','google_com_pa',\r
+'^www\.google\.com\.pe$','www_google_com_pe',\r
+'^images\.google\.com\.pe$','images_google_com_pe',\r
+'google\.com\.pe$','google_com_pe',\r
+'^www\.google\.com\.pg$','www_google_com_pg',\r
+'^images\.google\.com\.pg$','images_google_com_pg',\r
+'google\.com\.pg$','google_com_pg',\r
+'^www\.google\.com\.ph$','www_google_com_ph',\r
+'^images\.google\.com\.ph$','images_google_com_ph',\r
+'google\.com\.ph$','google_com_ph',\r
+'^www\.google\.com\.pk$','www_google_com_pk',\r
+'^images\.google\.com\.pk$','images_google_com_pk',\r
+'google\.com\.pk$','google_com_pk',\r
+'^www\.google\.com\.pr$','www_google_com_pr',\r
+'^images\.google\.com\.pr$','images_google_com_pr',\r
+'google\.com\.pr$','google_com_pr',\r
+'^www\.google\.com\.py$','www_google_com_py',\r
+'^images\.google\.com\.py$','images_google_com_py',\r
+'google\.com\.py$','google_com_py',\r
+'^www\.google\.com\.qa$','www_google_com_qa',\r
+'^images\.google\.com\.qa$','images_google_com_qa',\r
+'google\.com\.qa$','google_com_qa',\r
+'^www\.google\.com\.sa$','www_google_com_sa',\r
+'^images\.google\.com\.sa$','images_google_com_sa',\r
+'google\.com\.sa$','google_com_sa',\r
+'^www\.google\.com\.sb$','www_google_com_sb',\r
+'^images\.google\.com\.sb$','images_google_com_sb',\r
+'google\.com\.sb$','google_com_sb',\r
+'^www\.google\.com\.sg$','www_google_com_sg',\r
+'^images\.google\.com\.sg$','images_google_com_sg',\r
+'google\.com\.sg$','google_com_sg',\r
+'^www\.google\.com\.sl$','www_google_com_sl',\r
+'^images\.google\.com\.sl$','images_google_com_sl',\r
+'google\.com\.sl$','google_com_sl',\r
+'^www\.google\.com\.sv$','www_google_com_sv',\r
+'^images\.google\.com\.sv$','images_google_com_sv',\r
+'google\.com\.sv$','google_com_sv',\r
+'^www\.google\.com\.tj$','www_google_com_tj',\r
+'^images\.google\.com\.tj$','images_google_com_tj',\r
+'google\.com\.tj$','google_com_tj',\r
+'^www\.google\.com\.tw$','www_google_com_tw',\r
+'^images\.google\.com\.tw$','images_google_com_tw',\r
+'google\.com\.tw$','google_com_tw',\r
+'^www\.google\.com\.ua$','www_google_com_ua',\r
+'^images\.google\.com\.ua$','images_google_com_ua',\r
+'google\.com\.ua$','google_com_ua',\r
+'^www\.google\.com\.uy$','www_google_com_uy',\r
+'^images\.google\.com\.uy$','images_google_com_uy',\r
+'google\.com\.uy$','google_com_uy',\r
+'^www\.google\.com\.vc$','www_google_com_vc',\r
+'^images\.google\.com\.vc$','images_google_com_vc',\r
+'google\.com\.vc$','google_com_vc',\r
+'^www\.google\.com\.vn$','www_google_com_vn',\r
+'^images\.google\.com\.vn$','images_google_com_vn',\r
+'google\.com\.vn$','google_com_vn',\r
+'^www\.google\.cv$','www_google_cv',\r
+'^images\.google\.cv$','images_google_cv',\r
+'google\.cv$','google_cv',\r
+'^www\.google\.cz$','www_google_cz',\r
+'^images\.google\.cz$','images_google_cz',\r
+'google\.cz$','google_cz',\r
+'^www\.google\.dj$','www_google_dj',\r
+'^images\.google\.dj$','images_google_dj',\r
+'google\.dj$','google_dj',\r
+'^www\.google\.dk$','www_google_dk',\r
+'^images\.google\.dk$','images_google_dk',\r
+'google\.dk$','google_dk',\r
+'^www\.google\.dm$','www_google_dm',\r
+'^images\.google\.dm$','images_google_dm',\r
+'google\.dm$','google_dm',\r
+'^www\.google\.dz$','www_google_dz',\r
+'^images\.google\.dz$','images_google_dz',\r
+'google\.dz$','google_dz',\r
+'^www\.google\.ee$','www_google_ee',\r
+'^images\.google\.ee$','images_google_ee',\r
+'google\.ee$','google_ee',\r
+'^www\.google\.fi$','www_google_fi',\r
+'^images\.google\.fi$','images_google_fi',\r
+'google\.fi$','google_fi',\r
+'^www\.google\.fm$','www_google_fm',\r
+'^images\.google\.fm$','images_google_fm',\r
+'google\.fm$','google_fm',\r
+'^www\.google\.ga$','www_google_ga',\r
+'^images\.google\.ga$','images_google_ga',\r
+'google\.ga$','google_ga',\r
+'^www\.google\.ge$','www_google_ge',\r
+'^images\.google\.ge$','images_google_ge',\r
+'google\.ge$','google_ge',\r
+'^www\.google\.gf$','www_google_gf',\r
+'^images\.google\.gf$','images_google_gf',\r
+'google\.gf$','google_gf',\r
+'^www\.google\.gg$','www_google_gg',\r
+'^images\.google\.gg$','images_google_gg',\r
+'google\.gg$','google_gg',\r
+'^www\.google\.gl$','www_google_gl',\r
+'^images\.google\.gl$','images_google_gl',\r
+'google\.gl$','google_gl',\r
+'^www\.google\.gm$','www_google_gm',\r
+'^images\.google\.gm$','images_google_gm',\r
+'google\.gm$','google_gm',\r
+'^www\.google\.gp$','www_google_gp',\r
+'^images\.google\.gp$','images_google_gp',\r
+'google\.gp$','google_gp',\r
+'^www\.google\.gy$','www_google_gy',\r
+'^images\.google\.gy$','images_google_gy',\r
+'google\.gy$','google_gy',\r
+'^www\.google\.hn$','www_google_hn',\r
+'^images\.google\.hn$','images_google_hn',\r
+'google\.hn$','google_hn',\r
+'^www\.google\.ht$','www_google_ht',\r
+'^images\.google\.ht$','images_google_ht',\r
+'google\.ht$','google_ht',\r
+'^www\.google\.hu$','www_google_hu',\r
+'^images\.google\.hu$','images_google_hu',\r
+'google\.hu$','google_hu',\r
+'^www\.google\.im$','www_google_im',\r
+'^images\.google\.im$','images_google_im',\r
+'google\.im$','google_im',\r
+'^www\.google\.io$','www_google_io',\r
+'^images\.google\.io$','images_google_io',\r
+'google\.io$','google_io',\r
+'^www\.google\.iq$','www_google_iq',\r
+'^images\.google\.iq$','images_google_iq',\r
+'google\.iq$','google_iq',\r
+'^www\.google\.is$','www_google_is',\r
+'^images\.google\.is$','images_google_is',\r
+'google\.is$','google_is',\r
+'^www\.google\.je$','www_google_je',\r
+'^images\.google\.je$','images_google_je',\r
+'google\.je$','google_je',\r
+'^www\.google\.jo$','www_google_jo',\r
+'^images\.google\.jo$','images_google_jo',\r
+'google\.jo$','google_jo',\r
+'^www\.google\.kg$','www_google_kg',\r
+'^images\.google\.kg$','images_google_kg',\r
+'google\.kg$','google_kg',\r
+'^www\.google\.ki$','www_google_ki',\r
+'^images\.google\.ki$','images_google_ki',\r
+'google\.ki$','google_ki',\r
+'^www\.google\.kz$','www_google_kz',\r
+'^images\.google\.kz$','images_google_kz',\r
+'google\.kz$','google_kz',\r
+'^www\.google\.la$','www_google_la',\r
+'^images\.google\.la$','images_google_la',\r
+'google\.la$','google_la',\r
+'^www\.google\.li$','www_google_li',\r
+'^images\.google\.li$','images_google_li',\r
+'google\.li$','google_li',\r
+'^www\.google\.lk$','www_google_lk',\r
+'^images\.google\.lk$','images_google_lk',\r
+'google\.lk$','google_lk',\r
+'^www\.google\.lt$','www_google_lt',\r
+'^images\.google\.lt$','images_google_lt',\r
+'google\.lt$','google_lt',\r
+'^www\.google\.lu$','www_google_lu',\r
+'^images\.google\.lu$','images_google_lu',\r
+'google\.lu$','google_lu',\r
+'^www\.google\.lv$','www_google_lv',\r
+'^images\.google\.lv$','images_google_lv',\r
+'google\.lv$','google_lv',\r
+'^www\.google\.md$','www_google_md',\r
+'^images\.google\.md$','images_google_md',\r
+'google\.md$','google_md',\r
+'^www\.google\.me$','www_google_me',\r
+'^images\.google\.me$','images_google_me',\r
+'google\.me$','google_me',\r
+'^www\.google\.mg$','www_google_mg',\r
+'^images\.google\.mg$','images_google_mg',\r
+'google\.mg$','google_mg',\r
+'^www\.google\.mk$','www_google_mk',\r
+'^images\.google\.mk$','images_google_mk',\r
+'google\.mk$','google_mk',\r
+'^www\.google\.ml$','www_google_ml',\r
+'^images\.google\.ml$','images_google_ml',\r
+'google\.ml$','google_ml',\r
+'^www\.google\.mn$','www_google_mn',\r
+'^images\.google\.mn$','images_google_mn',\r
+'google\.mn$','google_mn',\r
+'^www\.google\.ms$','www_google_ms',\r
+'^images\.google\.ms$','images_google_ms',\r
+'google\.ms$','google_ms',\r
+'^www\.google\.mu$','www_google_mu',\r
+'^images\.google\.mu$','images_google_mu',\r
+'google\.mu$','google_mu',\r
+'^www\.google\.mv$','www_google_mv',\r
+'^images\.google\.mv$','images_google_mv',\r
+'google\.mv$','google_mv',\r
+'^www\.google\.mw$','www_google_mw',\r
+'^images\.google\.mw$','images_google_mw',\r
+'google\.mw$','google_mw',\r
+'^www\.google\.ne$','www_google_ne',\r
+'^images\.google\.ne$','images_google_ne',\r
+'google\.ne$','google_ne',\r
+'^www\.google\.nr$','www_google_nr',\r
+'^images\.google\.nr$','images_google_nr',\r
+'google\.nr$','google_nr',\r
+'^www\.google\.nu$','www_google_nu',\r
+'^images\.google\.nu$','images_google_nu',\r
+'google\.nu$','google_nu',\r
+'^www\.google\.pn$','www_google_pn',\r
+'^images\.google\.pn$','images_google_pn',\r
+'google\.pn$','google_pn',\r
+'^www\.google\.ps$','www_google_ps',\r
+'^images\.google\.ps$','images_google_ps',\r
+'google\.ps$','google_ps',\r
+'^www\.google\.ro$','www_google_ro',\r
+'^images\.google\.ro$','images_google_ro',\r
+'google\.ro$','google_ro',\r
+'^www\.google\.rs$','www_google_rs',\r
+'^images\.google\.rs$','images_google_rs',\r
+'google\.rs$','google_rs',\r
+'^www\.google\.ru$','www_google_ru',\r
+'^images\.google\.ru$','images_google_ru',\r
+'google\.ru$','google_ru',\r
+'^www\.google\.rw$','www_google_rw',\r
+'^images\.google\.rw$','images_google_rw',\r
+'google\.rw$','google_rw',\r
+'^www\.google\.sc$','www_google_sc',\r
+'^images\.google\.sc$','images_google_sc',\r
+'google\.sc$','google_sc',\r
+'^www\.google\.sh$','www_google_sh',\r
+'^images\.google\.sh$','images_google_sh',\r
+'google\.sh$','google_sh',\r
+'^www\.google\.si$','www_google_si',\r
+'^images\.google\.si$','images_google_si',\r
+'google\.si$','google_si',\r
+'^www\.google\.sk$','www_google_sk',\r
+'^images\.google\.sk$','images_google_sk',\r
+'google\.sk$','google_sk',\r
+'^www\.google\.sm$','www_google_sm',\r
+'^images\.google\.sm$','images_google_sm',\r
+'google\.sm$','google_sm',\r
+'^www\.google\.sn$','www_google_sn',\r
+'^images\.google\.sn$','images_google_sn',\r
+'google\.sn$','google_sn',\r
+'^www\.google\.so$','www_google_so',\r
+'^images\.google\.so$','images_google_so',\r
+'google\.so$','google_so',\r
+'^www\.google\.sr$','www_google_sr',\r
+'^images\.google\.sr$','images_google_sr',\r
+'google\.sr$','google_sr',\r
+'^www\.google\.st$','www_google_st',\r
+'^images\.google\.st$','images_google_st',\r
+'google\.st$','google_st',\r
+'^www\.google\.td$','www_google_td',\r
+'^images\.google\.td$','images_google_td',\r
+'google\.td$','google_td',\r
+'^www\.google\.tg$','www_google_tg',\r
+'^images\.google\.tg$','images_google_tg',\r
+'google\.tg$','google_tg',\r
+'^www\.google\.tk$','www_google_tk',\r
+'^images\.google\.tk$','images_google_tk',\r
+'google\.tk$','google_tk',\r
+'^www\.google\.tl$','www_google_tl',\r
+'^images\.google\.tl$','images_google_tl',\r
+'google\.tl$','google_tl',\r
+'^www\.google\.tm$','www_google_tm',\r
+'^images\.google\.tm$','images_google_tm',\r
+'google\.tm$','google_tm',\r
+'^www\.google\.tn$','www_google_tn',\r
+'^images\.google\.tn$','images_google_tn',\r
+'google\.tn$','google_tn',\r
+'^www\.google\.to$','www_google_to',\r
+'^images\.google\.to$','images_google_to',\r
+'google\.to$','google_to',\r
+'^www\.google\.tt$','www_google_tt',\r
+'^images\.google\.tt$','images_google_tt',\r
+'google\.tt$','google_tt',\r
+'^www\.google\.us$','www_google_us',\r
+'^images\.google\.us$','images_google_us',\r
+'google\.us$','google_us',\r
+'^www\.google\.vg$','www_google_vg',\r
+'^images\.google\.vg$','images_google_vg',\r
+'google\.vg$','google_vg',\r
+'^www\.google\.vu$','www_google_vu',\r
+'^images\.google\.vu$','images_google_vu',\r
+'google\.vu$','google_vu',\r
+'^www\.google\.ws$','www_google_ws',\r
+'^images\.google\.ws$','images_google_ws',\r
+'google\.ws$','google_ws',\r
+\r
+'au\.search\.yahoo\.com','au_search_yahoo_com',\r
+'ca\.search\.yahoo\.com','ca_search_yahoo_com',\r
+'fr\.search\.yahoo\.com','fr_search_yahoo_com',\r
+'image\.search\.yahoo\.co\.jp','image_search_yahoo_co_jp',\r
+'images\.search\.yahoo\.com','images_search_yahoo_com',\r
+'it\.search\.yahoo\.com','it_search_yahoo_com',\r
+'ph\.search\.yahoo\.com','ph_search_yahoo_com',\r
+'se\.search\.yahoo\.com','se_search_yahoo_com',\r
+'search\.yahoo\.co\.jp','search_yahoo_co_jp',\r
+'sg\.search\.yahoo\.com','sg_search_yahoo_com',\r
+'sg\.yhs4\.search\.yahoo\.com','sg_yhs4_search_yahoo_com',\r
+'tw\.images\.search\.yahoo\.com','tw_images_search_yahoo_com',\r
+'uk\.search\.yahoo\.com','uk_search_yahoo_com',\r
+'uk\.yhs4\.search\.yahoo\.com','uk_yhs4_search_yahoo_com',\r
+'us\.search\.yahoo\.com','us_search_yahoo_com',\r
+'search\.yahoo\.com','search_yahoo_com',\r
+'search\.yahoo','yahoo_catchall',\r
+\r
+'babylon\.com','babylon',\r
+'search\.conduit\.com','conduit',\r
+'avg\.com','avg',\r
+'mywebsearch\.com','mywebsearch',\r
+\r
+'msn\.','msn',\r
+'live\.com','live',\r
+\r
+'search\.aol\.co\.uk','aoluk',\r
+'searcht\.aol\.co\.uk','aoluk',\r
+'searcht\.aol\.com','aolcom',\r
+'search\.aol\.com','aolcom',\r
+'recherche\.aol\.fr','aolfr',\r
+'suche\.aol\.de','aolde',\r
+'de\.aolsearch\.com','aolsearchde',\r
+'sucheaol\.aol\.de','sucheaolde',\r
+'search\.hp\.my\.aol\.co\.uk','hp_my_aol',\r
+'search\.aol\.pl','aolpl',\r
+'o2suche\.aol\.de','aol_o2suche_de',\r
+'search\.aol\.','aolcatchall',\r
+\r
+'^uk\.ask\.com$','askuk',\r
+'^de\.ask\.com$','askde',\r
+'tb\.ask\.com$','tbask',\r
+'^images\.ask\.com$','askimages',\r
+\r
+'base\.google\.','google_base',\r
+'froogle\.google\.','google_froogle',\r
+'google\.[\w.]+/products','google_products',\r
+'googlecom\.com','google_catchall',\r
+'groups\.google\.','google_groups',\r
+'googlee\.','google_catchall',\r
+\r
+'216\.239\.32\.20','google_catchall',\r
+'173\.194\.32\.223','google_catchall',\r
+'216\.239\.(35|37|39|51)\.100','google_cache',\r
+'216\.239\.(35|37|39|51)\.101','google_cache',\r
+'216\.239\.5[0-9]\.104','google_cache',\r
+'64\.233\.1[0-9]{2}\.104','google_cache',\r
+'66\.102\.[1-9]\.104','google_cache',\r
+'66\.249\.93\.104','google_cache',\r
+'72\.14\.2[0-9]{2}\.104','google_cache',\r
+\r
+'maps\.google','google_maps',\r
+'translate\.google','google_translate',\r
+'173\.194\.35\.177','googleByIP',\r
+'google\.','google_catchall',\r
+\r
+'mail.yahoo.net','yahoo_catchall',\r
+'(66\.218\.71\.225|216\.109\.117\.135|216\.109\.125\.130|66\.218\.69\.11)','yahoo_catchall',\r
+'mindset\.research\.yahoo','yahoo_mindset',\r
+'yahoo\.','yahoo_catchall',\r
+'^www\.ask\.jp$','askjp',\r
+'^es\.ask\.com$','askes',\r
+'^fr\.ask\.com$','askfr',\r
+'^www\.iask\.com$','iask',\r
+'^it\.ask\.com$','askit',\r
+'^nl\.ask\.com$','asknl',\r
+'(^|\.)ask\.com$','askcatchall',\r
+\r
+'www\.tesco\.net','tesco',\r
+'yell\.','yell',\r
+'zapmeta\.ch','zapmeta_ch',\r
+'zapmeta\.com','zapmeta_com',\r
+'zapmeta\.de','zapmeta_de',\r
+'zapmeta','zapmeta_catchall',\r
+\r
+'(^|\.)go\.com','go',\r
+'(161\.58\.227\.204|161\.58\.247\.101|212\.40\.165\.90|213\.133\.108\.202|217\.160\.108\.151|217\.160\.111\.99|217\.160\.131\.108|217\.160\.142\.227|217\.160\.176\.42)','metacrawler_de',\r
+'\.facemoods\.com','facemoods',\r
+'\.funmoods\.com','funmoods',\r
+'\.metasearch\.','metasearch',\r
+'\.wow\.com','wowuk',\r
+'163\.com','netease',\r
+'1klik\.dk','1klik',\r
+'1search-board\.com','1search',\r
+'212\.227\.33\.241','metaspinner',\r
+'3721\.com','3721',\r
+'4\-counter\.com','google4counter',\r
+'a9\.com','a9',\r
+'accoona\.com','accoona',\r
+'alexa\.com','alexa',\r
+'allesklar\.de','allesklar',\r
+'alltheweb\.com','alltheweb',\r
+'altavista\.','altavista',\r
+'amazon\.','amazon',\r
+'androidsearch\.com','androidsearch',\r
+'answerbus\.com','answerbus',\r
+'anzwers\.com\.au','anzwers',\r
+'aport\.ru','aport',\r
+'arianna\.libero\.it','arianna',\r
+'as\.starware\.com','comettoolbar',\r
+'asevenboard\.com','asevenboard',\r
+'atlanticbb\.net','atlanticbb',\r
+'atlas\.cz','atlas',\r
+'atomz\.','atomz',\r
+'att\.net','att',\r
+'auone\.jp','auone',\r
+'avantfind\.com','avantfind',\r
+'baidu\.com','baidu',\r
+'bbc\.co\.uk/cgi-bin/search','bbc',\r
+'biglotron\.com', 'biglotron',\r
+'blekko\.com','blekko',\r
+'blingo\.com','blingo',\r
+'bungeebonesdotcom','bungeebonesdotcom',\r
+'centraldatabase\.org','centraldatabase',\r
+'centrum\.cz','centrum',\r
+'centurylink\.net','centurylink',\r
+'charter\.net','charter',\r
+'chatzum\.com','chatzum',\r
+'checkparams\.com','checkparams',\r
+'chello\.at','chelloat',\r
+'chello\.be','chellobe',\r
+'chello\.cz','chellocz',\r
+'chello\.fr','chellofr',\r
+'chello\.hu','chellohu',\r
+'chello\.nl','chellonl',\r
+'chello\.no','chellono',\r
+'chello\.pl','chellopl',\r
+'chello\.se','chellose',\r
+'chello\.sk','chellosk',\r
+'chello','chellocom',\r
+'claro-search\.com','clarosearch',\r
+'clinck\.in','clinck',\r
+'clusty\.com','clusty',\r
+'copernic\.com','copernic',\r
+'crawler\.com','crawler',\r
+'ctrouve\.','ctrouve',\r
+'dalesearch\.com','dalesearch',\r
+'danielsen\.com','danielsen',\r
+'daum\.net','daum',\r
+'de\.dolphin\.com','de_dolphin_com',\r
+'de\.wiki\.gov\.cn','de_wiki_gov_cn',\r
+'de\.wow\.com','wowsearch',\r
+'dejanews\.','dejanews',\r
+'del\.icio\.us','delicious',\r
+'delta-search','delta-search',\r
+'digg\.com','digg',\r
+'dmoz\.org','dmoz',\r
+'dodaj\.pl','dodajpl',\r
+'dogpile\.com','dogpile',\r
+'duckduckgo','duckduckgo',\r
+'easysearch\.org\.uk','easysearch',\r
+'ecosia\.org','ecosia',\r
+'edderkoppen\.dk','edderkoppen',\r
+'engine\.exe','engine',\r
+'eniro\.no','eniro',\r
+'eniro\.se','enirose',\r
+'ereadingsource\.com','ereadingsource',\r
+'es\.mirago\.com','miragoes',\r
+'etools\.ch','etools_ch',\r
+'euroseek\.','euroseek',\r
+'everyclick\.com','everyclick',\r
+'evreka\.passagen\.se','passagen',\r
+'excite\.','excite',\r
+'extern\.peoplecheck\.de','peoplecheck_de',\r
+'fastbot\.de','fastbot_de',\r
+'find\.dk','finddk',\r
+'find1friend\.com','find1friend',\r
+'findamo\.com','findamo',\r
+'findarticles\.com','findarticles',\r
+'fireball\.de','fireball',\r
+'forums\.iboats\.com','iboats',\r
+'foxstart\.com','foxstart',\r
+'francite\.','francite',\r
+'gazeta\.pl','gazetapl',\r
+'gery\.pl','gerypl',\r
+'globososo\.','globososo',\r
+'go\.mail\.ru','go.mail.ru',\r
+'go\.speedbit\.com','speedbit',\r
+'go2net\.com','go2net',\r
+'godado','godado',\r
+'goggle\.co\.hu$','goggle (what)',\r
+'goliat\.hu','goliat',\r
+'goodsearch\.com','goodsearch',\r
+'gotuneed\.com','gotuneed',\r
+'haku\.www\.fi','haku',\r
+'heureka\.hu','heureka',\r
+'hoga\.pl','hogapl',\r
+'hotbot\.','hotbot',\r
+'hubwe\.net','hubwe',\r
+'icerocket\.com','icerocket',\r
+'icq\.com\/search','icq',\r
+'ifind\.freeserve','freeserve',\r
+'ilse\.','ilse',\r
+'inbox\.com','inbox',\r
+'index\.hu','indexhu',\r
+'ineffabile\.it','ineffabile',\r
+'info\.co\.uk','infouk',\r
+'infoseek\.de','infoseek',\r
+'infospace\.com','infospace',\r
+'inspsearch\.com','inspsearch',\r
+'int\.search\.myway\.com','int_search_myway_com',\r
+'int\.search-results\.com','nortonsavesearch',\r
+'interia\.pl','interiapl',\r
+'isearch\.nation\.com','isearch_nation_com',\r
+'i-une\.com','iune',\r
+'ixquick\.com','ixquick',\r
+'izito\.co\.uk','izito_uk',\r
+'izito\.co\.de','izito_co_de',\r
+'izito\.','izito_catchall',\r
+'jubii\.dk','jubii',\r
+'jumpy\.it','jumpyit',\r
+'juno\.com','juno',\r
+'jyxo\.(cz|com)','jyxo',\r
+'kartoo\.com','kartoo',\r
+'katalog\.onet\.pl','katalogonetpl',\r
+'kataweb\.it','kataweb',\r
+'kereso\.startlap\.hu','startlap_hu',\r
+'keresolap\.hu','keresolap_hu',\r
+'kvasir\.','kvasir',\r
+'kvitters\.','kvitters',\r
+'lapkereso\.hu','lapkereso_hu',\r
+'lbb\.org','lbb',\r
+'ledix\.net','ledix',\r
+'libero\.it/','libero',\r
+'localmoxie\.com','localmoxie',\r
+'looksmart\.co\.uk','looksmart_co_uk',\r
+'looksmart\.','looksmart_catchall',\r
+'lycos\.','lycos',\r
+'mamma\.','mamma',\r
+'meinestadt\.de','meinestadt',\r
+'meta\.ua','metaua',\r
+'metabot\.ru','metabot',\r
+'metacrawler\.','metacrawler',\r
+'metager\.de','metager',\r
+'miner\.bol\.com\.br','miner',\r
+'mirago\.be','miragobe',\r
+'mirago\.ch','miragoch',\r
+'mirago\.co\.uk','miragocouk',\r
+'mirago\.de','miragode',\r
+'mirago\.dk','miragodk',\r
+'mirago\.fr','miragofr',\r
+'mirago\.it','miragoit',\r
+'mirago\.nl','miragonl',\r
+'mirago\.se','miragose',\r
+'mirago','mirago',\r
+'mitrasites\.com','mitrasites',\r
+'mozbot\.fr', 'mozbot',\r
+'my\.allgameshome\.com','allgameshome',\r
+'mys\.yoursearch\.me','mys_yoursearch_me',\r
+'mysearch\.','mysearch',\r
+'mysearchdial\.com','mysearchdial',\r
+'mysearchresults\.com','mysearchresults',\r
+'myway\.com','myway',\r
+'najdi\.to','najdi',\r
+'nation\.','nation',\r
+'navigationshilfe\.t-online\.de','navigationshilfe_t_online',\r
+'nbci\.com\/search','nbci',\r
+'netluchs\.de','netluchs',\r
+'netscape\.','netscape',\r
+'netsprint\.pl','netsprintpl',\r
+'netstjernen\.dk','netstjernen',\r
+'netzero\.net','netzero',\r
+'no\.mirago\.com','miragono',\r
+'northernlight\.','northernlight',\r
+'nusearch\.com','nusearch',\r
+'o2\.pl','o2pl',\r
+'ofir\.dk','ofir',\r
+'opasia\.dk','opasia',\r
+'orangeworld\.co\.uk','orangeworld',\r
+'orbis\.dk','orbis',\r
+'overture\.com','overture',\r
+'pch\.com','pch',\r
+'picsearch\.de','picsearch',\r
+'pictures\.com','pictures',\r
+'plusnetwork\.com','plusnetwork',\r
+'pogodak\.','pogodak',\r
+'polska\.pl','polskapl',\r
+'polymeta\.hu','polymeta_hu',\r
+'preciobarato\.xyz','preciobarato_xyz',\r
+'questionanswering\.com','questionanswering',\r
+'quick\.cz','quick',\r
+'rambler\.ru','rambler',\r
+'recherche\.club-internet\.fr','clubinternet',\r
+'rechercher\.libertysurf\.fr','libertysurf',\r
+'redbox\.cz','redbox',\r
+'rr\.com','rr',\r
+'sagool\.jp','sagool',\r
+'sapo\.pt','sapo',\r
+'schoenerbrausen\.de','schoenerbrausen',\r
+'scroogle\.org','scroogle',\r
+'search[\w\-]+\.free\.fr','free',\r
+'search\.1und1\.de','search_1und1_de',\r
+'search\.alice\.it\.master','aliceitmaster',\r
+'search\.alice\.it','aliceit',\r
+'search\.alot\.com','alot',\r
+'search\.bluewin\.ch','bluewin',\r
+'search\.bt\.com','bt',\r
+'search\.certified-toolbar\.com','certifiedtoolbarsearch',\r
+'search\.ch','searchch',\r
+'search\.comcast\.net','comcast',\r
+'search\.earthlink\.net','earthlink',\r
+'search\.fbdownloader\.com','fbdownloader',\r
+'search\.fdownloadr\.com','fdownloadr_com',\r
+'search\.foxtab\.com','search_foxtab_com',\r
+'search\.genieo\.com','genieo',\r
+'search\.goo\.ne\.jp','ichiro',\r
+'search\.handycafe\.com','handycafe',\r
+'search\.incredibar\.com','incredibar',\r
+'search\.incredimail\.com','incredimail',\r
+'search\.internetto\.hu','internetto',\r
+'search\.orange\.co\.uk','orange',\r
+'search\.sky\.com','sky',\r
+'search\.sli\.sympatico\.ca','sympatico',\r
+'search\.socialdownloadr\.com','search_socialdownloadr_com',\r
+'search\.sweetim\.com','sweetim',\r
+'search\.terra\.','terra',\r
+'search\.zonealarm\.com','search_zonealarm_com',\r
+'searchalgo\.com','searchalgo',\r
+'searchalot\.com','searchalot',\r
+'searchcompletion\.com','searchcompletion',\r
+'searches\.qone8\.com','searches_qone8_com',\r
+'searches\.safehomepage\.com','safehomepage_com',\r
+'searches\.vi-view\.com','vi-view_com',\r
+'searchesnavigator\.com','searchesnavigator',\r
+'searchgol\.com','searchgol',\r
+'searchlistingsite\.com','searchlistingsite',\r
+'searchmobileonline\.com','searchmobileonline',\r
+'search-results\.com','searchresultscom',\r
+'search-results\.mobi','search-results_mobi',\r
+'searchsafer\.com','searchsafer',\r
+'searchy\.co\.uk','searchy',\r
+'searchya\.com','searchya',\r
+'segnalo\.alice\.it','segnalo',\r
+'semalt\.com','semalt',\r
+'sensis\.com\.au','sensis',\r
+'seznam\.cz','seznam',\r
+'shinyseek\.it','shinyseek\.it',\r
+'shoppstop\.com','shoppstop',\r
+'sify\.com','sify',\r
+'sm\.de','smde',\r
+'smartsuggestor\.com','smartsuggestor',\r
+'snapdo\.com','snapdo',\r
+'softonic\.com','softonic',\r
+'sogou\.com','sogou',\r
+'sok\.start\.no','start',\r
+'sol\.dk','sol',\r
+'soso\.com','soso',\r
+'sphere\.com','sphere',\r
+'splut\.','splut',\r
+'spotjockey\.','spotjockey',\r
+'spray\.','spray',\r
+'sr\.searchfunmoods\.com','searchfunmoods',\r
+'start\.iminent\.com','iminent',\r
+'start\.shaw\.ca','shawca',\r
+'start\.toshiba\.com','toshiba',\r
+'startpage\.com','startpage',\r
+'startsiden\.no','startsiden',\r
+'static\.flipora\.com','flipora',\r
+'steadysearch\.com','steadysearch',\r
+'steady-search\.com','steadysearch',\r
+'stumbleupon\.com','stumbleupon',\r
+'suche\.1und1\.de','1und1_de',\r
+'suche\.freenet\.de','freenet_de',\r
+'suche\.gmx\.at','gmxsuche_at',\r
+'suche\.gmx\.net','gmxsuche',\r
+'suche\d?\.web\.de','webde',\r
+'suchen\.abacho\.de','abacho',\r
+'sumaja\.de','sumaja',\r
+'supereva\.com','supereva',\r
+'surfcanyon\.com','surfcanyon_com',\r
+'sweetpacks-search\.com','sweetpacks',\r
+'swik\.net','swik',\r
+'swisscows\.ch','swisscows_ch',\r
+'szukacz\.pl','szukaczpl',\r
+'szukaj\.onet\.pl','onetpl',\r
+'szukaj\.wp\.pl','wp',\r
+'talktalk\.co\.uk','talktalk_uk',\r
+'tango\.hu','tango_hu',\r
+'teecno\.it','teecnoit',\r
+'teoma\.','teoma',\r
+'theallsearches\.com','theallsearches',\r
+'three\.co\.uk','three',\r
+'tiscali\.','tiscali',\r
+'tixuma\.de','tixuma_de',\r
+'toile\.com','toile',\r
+'t-online\.de','t_online_de',\r
+'t-online','t_online_catchall',\r
+'turtle\.ru','turtle',\r
+'tyfon\.dk','tyfon',\r
+'uk\.foxstart\.com','uk_foxstart_com',\r
+'ukdirectory\.','ukdirectory',\r
+'ukindex\.co\.uk','ukindex',\r
+'ukplus\.','ukplus',\r
+'umfis\.de','umfis',\r
+'umuwa\.de','umuwa_de',\r
+'uni-hannover\.de','metahannover',\r
+'vindex\.','vindex',\r
+'virgilio\.it','virgilio',\r
+'virginmedia\.com','virginmedia',\r
+'vivisimo\.com','vivisimo',\r
+'vizsla\.origo\.hu','origo',\r
+'vnet\.cn','vnet',\r
+'voila\.','voila',\r
+'wahoo\.hu','wahoo',\r
+'webalta\.ru','webalta',\r
+'webcrawler\.','webcrawler',\r
+'webmania\.hu','webmania',\r
+'websearch\.rakuten\.co\.jp','rakuten',\r
+'whorush\.com','whorush_com',\r
+'windowssearch\.com','windowssearch_com',\r
+'wisenut\.com','wisenut',\r
+'wow\.pl','wowpl',\r
+'wow\.utop\.it','wow_utop_it',\r
+'www\.benefind\.de','benefind',\r
+'www\.buenosearch\.com','www_buenosearch_com',\r
+'www\.dregol\.com','www_dregol_com',\r
+'www\.govome\.com','govome',\r
+'www\.holasearch\.com','holasearch',\r
+'www\.metasuche\.ch','metasuche_ch',\r
+'www\.oneseek\.de','oneseek_de',\r
+'www\.qwant\.com','qwant_com',\r
+'www\.search\.com','search.com',\r
+'www\.startxxl\.com','startxxl',\r
+'www\.vlips\.de','vlips_de',\r
+'www\.wow\.com','www_wow_com',\r
+'www1\.search-results\.com','searchresults',\r
+'wwweasel\.de','wwweasel',\r
+'yourbestsearch\.net','yourbestsearch',\r
+'youtube\.com','youtube',\r
+'zhongsou\.com','zhongsou',\r
+'zoeken\.nl','zoeken',\r
+'zoznam\.sk','zoznam',\r
+# Generic search engines\r
+'search\..*\.\w+','search'\r
+);\r
+\r
+# SearchEnginesWithKeysNotInQuery (keyed by search engine ID, e.g. 'a9')\r
+# Search engines that carry the search keywords in the URL path (the "page") instead of in a query parameter; the value 1 presumably only flags membership (confirm against the code that reads this hash)\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesWithKeysNotInQuery=(\r
+'a9',1    # e.g. www.a9.com/searchkey1%20searchkey2 (keywords follow the host as the path)\r
+);\r
+\r
+# SearchEnginesKnownUrl\r
+# Known rules to extract keywords from a referrer search engine URL\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesKnownUrl=(\r
+# Query keys\r
+\r
+'www_google_co_uk','(p|q|as_p|as_q)=',\r
+'images_google_co_uk','(p|q|as_p|as_q)=',\r
+'google_co_uk','(p|q|as_p|as_q)=',\r
+'www_google_com','(p|q|as_p|as_q)=',\r
+'images_google_com','(p|q|as_p|as_q)=',\r
+'google_com','(p|q|as_p|as_q)=',\r
+'www_google_de','(p|q|as_p|as_q)=',\r
+'images_google_de','(p|q|as_p|as_q)=',\r
+'google_de','(p|q|as_p|as_q)=',\r
+'www_google_fr','(p|q|as_p|as_q)=',\r
+'images_google_fr','(p|q|as_p|as_q)=',\r
+'google_fr','(p|q|as_p|as_q)=',\r
+'www_google_ca','(p|q|as_p|as_q)=',\r
+'images_google_ca','(p|q|as_p|as_q)=',\r
+'google_ca','(p|q|as_p|as_q)=',\r
+'www_google_es','(p|q|as_p|as_q)=',\r
+'images_google_es','(p|q|as_p|as_q)=',\r
+'google_es','(p|q|as_p|as_q)=',\r
+'www_google_com_au','(p|q|as_p|as_q)=',\r
+'images_google_com_au','(p|q|as_p|as_q)=',\r
+'google_com_au','(p|q|as_p|as_q)=',\r
+'www_google_nl','(p|q|as_p|as_q)=',\r
+'images_google_nl','(p|q|as_p|as_q)=',\r
+'google_nl','(p|q|as_p|as_q)=',\r
+'www_google_gr','(p|q|as_p|as_q)=',\r
+'images_google_gr','(p|q|as_p|as_q)=',\r
+'google_gr','(p|q|as_p|as_q)=',\r
+'www_google_se','(p|q|as_p|as_q)=',\r
+'images_google_se','(p|q|as_p|as_q)=',\r
+'google_se','(p|q|as_p|as_q)=',\r
+'www_google_ie','(p|q|as_p|as_q)=',\r
+'images_google_ie','(p|q|as_p|as_q)=',\r
+'google_ie','(p|q|as_p|as_q)=',\r
+'www_google_it','(p|q|as_p|as_q)=',\r
+'images_google_it','(p|q|as_p|as_q)=',\r
+'google_it','(p|q|as_p|as_q)=',\r
+'www_google_no','(p|q|as_p|as_q)=',\r
+'images_google_no','(p|q|as_p|as_q)=',\r
+'google_no','(p|q|as_p|as_q)=',\r
+'www_google_com_tr','(p|q|as_p|as_q)=',\r
+'images_google_com_tr','(p|q|as_p|as_q)=',\r
+'google_com_tr','(p|q|as_p|as_q)=',\r
+'www_google_co_in','(p|q|as_p|as_q)=',\r
+'images_google_co_in','(p|q|as_p|as_q)=',\r
+'google_co_in','(p|q|as_p|as_q)=',\r
+'www_google_pt','(p|q|as_p|as_q)=',\r
+'images_google_pt','(p|q|as_p|as_q)=',\r
+'google_pt','(p|q|as_p|as_q)=',\r
+'www_google_hr','(p|q|as_p|as_q)=',\r
+'images_google_hr','(p|q|as_p|as_q)=',\r
+'google_hr','(p|q|as_p|as_q)=',\r
+'www_google_co_nz','(p|q|as_p|as_q)=',\r
+'images_google_co_nz','(p|q|as_p|as_q)=',\r
+'google_co_nz','(p|q|as_p|as_q)=',\r
+'www_google_pl','(p|q|as_p|as_q)=',\r
+'images_google_pl','(p|q|as_p|as_q)=',\r
+'google_pl','(p|q|as_p|as_q)=',\r
+'www_google_ac','(p|q|as_p|as_q)=',\r
+'images_google_ac','(p|q|as_p|as_q)=',\r
+'google_ac','(p|q|as_p|as_q)=',\r
+'www_google_ad','(p|q|as_p|as_q)=',\r
+'images_google_ad','(p|q|as_p|as_q)=',\r
+'google_ad','(p|q|as_p|as_q)=',\r
+'www_google_ae','(p|q|as_p|as_q)=',\r
+'images_google_ae','(p|q|as_p|as_q)=',\r
+'google_ae','(p|q|as_p|as_q)=',\r
+'www_google_al','(p|q|as_p|as_q)=',\r
+'images_google_al','(p|q|as_p|as_q)=',\r
+'google_al','(p|q|as_p|as_q)=',\r
+'www_google_am','(p|q|as_p|as_q)=',\r
+'images_google_am','(p|q|as_p|as_q)=',\r
+'google_am','(p|q|as_p|as_q)=',\r
+'www_google_as','(p|q|as_p|as_q)=',\r
+'images_google_as','(p|q|as_p|as_q)=',\r
+'google_as','(p|q|as_p|as_q)=',\r
+'www_google_at','(p|q|as_p|as_q)=',\r
+'images_google_at','(p|q|as_p|as_q)=',\r
+'google_at','(p|q|as_p|as_q)=',\r
+'www_google_az','(p|q|as_p|as_q)=',\r
+'images_google_az','(p|q|as_p|as_q)=',\r
+'google_az','(p|q|as_p|as_q)=',\r
+'www_google_ba','(p|q|as_p|as_q)=',\r
+'images_google_ba','(p|q|as_p|as_q)=',\r
+'google_ba','(p|q|as_p|as_q)=',\r
+'www_google_be','(p|q|as_p|as_q)=',\r
+'images_google_be','(p|q|as_p|as_q)=',\r
+'google_be','(p|q|as_p|as_q)=',\r
+'www_google_bf','(p|q|as_p|as_q)=',\r
+'images_google_bf','(p|q|as_p|as_q)=',\r
+'google_bf','(p|q|as_p|as_q)=',\r
+'www_google_bg','(p|q|as_p|as_q)=',\r
+'images_google_bg','(p|q|as_p|as_q)=',\r
+'google_bg','(p|q|as_p|as_q)=',\r
+'www_google_bi','(p|q|as_p|as_q)=',\r
+'images_google_bi','(p|q|as_p|as_q)=',\r
+'google_bi','(p|q|as_p|as_q)=',\r
+'www_google_bj','(p|q|as_p|as_q)=',\r
+'images_google_bj','(p|q|as_p|as_q)=',\r
+'google_bj','(p|q|as_p|as_q)=',\r
+'www_google_bs','(p|q|as_p|as_q)=',\r
+'images_google_bs','(p|q|as_p|as_q)=',\r
+'google_bs','(p|q|as_p|as_q)=',\r
+'www_google_bt','(p|q|as_p|as_q)=',\r
+'images_google_bt','(p|q|as_p|as_q)=',\r
+'google_bt','(p|q|as_p|as_q)=',\r
+'www_google_by','(p|q|as_p|as_q)=',\r
+'images_google_by','(p|q|as_p|as_q)=',\r
+'google_by','(p|q|as_p|as_q)=',\r
+'www_google_cat','(p|q|as_p|as_q)=',\r
+'images_google_cat','(p|q|as_p|as_q)=',\r
+'google_cat','(p|q|as_p|as_q)=',\r
+'www_google_cc','(p|q|as_p|as_q)=',\r
+'images_google_cc','(p|q|as_p|as_q)=',\r
+'google_cc','(p|q|as_p|as_q)=',\r
+'www_google_cd','(p|q|as_p|as_q)=',\r
+'images_google_cd','(p|q|as_p|as_q)=',\r
+'google_cd','(p|q|as_p|as_q)=',\r
+'www_google_cf','(p|q|as_p|as_q)=',\r
+'images_google_cf','(p|q|as_p|as_q)=',\r
+'google_cf','(p|q|as_p|as_q)=',\r
+'www_google_cg','(p|q|as_p|as_q)=',\r
+'images_google_cg','(p|q|as_p|as_q)=',\r
+'google_cg','(p|q|as_p|as_q)=',\r
+'www_google_ch','(p|q|as_p|as_q)=',\r
+'images_google_ch','(p|q|as_p|as_q)=',\r
+'google_ch','(p|q|as_p|as_q)=',\r
+'www_google_ci','(p|q|as_p|as_q)=',\r
+'images_google_ci','(p|q|as_p|as_q)=',\r
+'google_ci','(p|q|as_p|as_q)=',\r
+'www_google_cl','(p|q|as_p|as_q)=',\r
+'images_google_cl','(p|q|as_p|as_q)=',\r
+'google_cl','(p|q|as_p|as_q)=',\r
+'www_google_cm','(p|q|as_p|as_q)=',\r
+'images_google_cm','(p|q|as_p|as_q)=',\r
+'google_cm','(p|q|as_p|as_q)=',\r
+'www_google_cn','(p|q|as_p|as_q)=',\r
+'images_google_cn','(p|q|as_p|as_q)=',\r
+'google_cn','(p|q|as_p|as_q)=',\r
+'www_google_co_ao','(p|q|as_p|as_q)=',\r
+'images_google_co_ao','(p|q|as_p|as_q)=',\r
+'google_co_ao','(p|q|as_p|as_q)=',\r
+'www_google_co_bw','(p|q|as_p|as_q)=',\r
+'images_google_co_bw','(p|q|as_p|as_q)=',\r
+'google_co_bw','(p|q|as_p|as_q)=',\r
+'www_google_co_ck','(p|q|as_p|as_q)=',\r
+'images_google_co_ck','(p|q|as_p|as_q)=',\r
+'google_co_ck','(p|q|as_p|as_q)=',\r
+'www_google_co_cr','(p|q|as_p|as_q)=',\r
+'images_google_co_cr','(p|q|as_p|as_q)=',\r
+'google_co_cr','(p|q|as_p|as_q)=',\r
+'www_google_co_id','(p|q|as_p|as_q)=',\r
+'images_google_co_id','(p|q|as_p|as_q)=',\r
+'google_co_id','(p|q|as_p|as_q)=',\r
+'www_google_co_il','(p|q|as_p|as_q)=',\r
+'images_google_co_il','(p|q|as_p|as_q)=',\r
+'google_co_il','(p|q|as_p|as_q)=',\r
+'www_google_co_jp','(p|q|as_p|as_q)=',\r
+'images_google_co_jp','(p|q|as_p|as_q)=',\r
+'google_co_jp','(p|q|as_p|as_q)=',\r
+'www_google_co_ke','(p|q|as_p|as_q)=',\r
+'images_google_co_ke','(p|q|as_p|as_q)=',\r
+'google_co_ke','(p|q|as_p|as_q)=',\r
+'www_google_co_kr','(p|q|as_p|as_q)=',\r
+'images_google_co_kr','(p|q|as_p|as_q)=',\r
+'google_co_kr','(p|q|as_p|as_q)=',\r
+'www_google_co_ls','(p|q|as_p|as_q)=',\r
+'images_google_co_ls','(p|q|as_p|as_q)=',\r
+'google_co_ls','(p|q|as_p|as_q)=',\r
+'www_google_co_ma','(p|q|as_p|as_q)=',\r
+'images_google_co_ma','(p|q|as_p|as_q)=',\r
+'google_co_ma','(p|q|as_p|as_q)=',\r
+'www_google_co_mz','(p|q|as_p|as_q)=',\r
+'images_google_co_mz','(p|q|as_p|as_q)=',\r
+'google_co_mz','(p|q|as_p|as_q)=',\r
+'www_google_co_th','(p|q|as_p|as_q)=',\r
+'images_google_co_th','(p|q|as_p|as_q)=',\r
+'google_co_th','(p|q|as_p|as_q)=',\r
+'www_google_co_tz','(p|q|as_p|as_q)=',\r
+'images_google_co_tz','(p|q|as_p|as_q)=',\r
+'google_co_tz','(p|q|as_p|as_q)=',\r
+'www_google_co_ug','(p|q|as_p|as_q)=',\r
+'images_google_co_ug','(p|q|as_p|as_q)=',\r
+'google_co_ug','(p|q|as_p|as_q)=',\r
+'www_google_co_uz','(p|q|as_p|as_q)=',\r
+'images_google_co_uz','(p|q|as_p|as_q)=',\r
+'google_co_uz','(p|q|as_p|as_q)=',\r
+'www_google_co_ve','(p|q|as_p|as_q)=',\r
+'images_google_co_ve','(p|q|as_p|as_q)=',\r
+'google_co_ve','(p|q|as_p|as_q)=',\r
+'www_google_co_vi','(p|q|as_p|as_q)=',\r
+'images_google_co_vi','(p|q|as_p|as_q)=',\r
+'google_co_vi','(p|q|as_p|as_q)=',\r
+'www_google_co_za','(p|q|as_p|as_q)=',\r
+'images_google_co_za','(p|q|as_p|as_q)=',\r
+'google_co_za','(p|q|as_p|as_q)=',\r
+'www_google_co_zm','(p|q|as_p|as_q)=',\r
+'images_google_co_zm','(p|q|as_p|as_q)=',\r
+'google_co_zm','(p|q|as_p|as_q)=',\r
+'www_google_co_zw','(p|q|as_p|as_q)=',\r
+'images_google_co_zw','(p|q|as_p|as_q)=',\r
+'google_co_zw','(p|q|as_p|as_q)=',\r
+'www_google_com_af','(p|q|as_p|as_q)=',\r
+'images_google_com_af','(p|q|as_p|as_q)=',\r
+'google_com_af','(p|q|as_p|as_q)=',\r
+'www_google_com_ag','(p|q|as_p|as_q)=',\r
+'images_google_com_ag','(p|q|as_p|as_q)=',\r
+'google_com_ag','(p|q|as_p|as_q)=',\r
+'www_google_com_ai','(p|q|as_p|as_q)=',\r
+'images_google_com_ai','(p|q|as_p|as_q)=',\r
+'google_com_ai','(p|q|as_p|as_q)=',\r
+'www_google_com_ar','(p|q|as_p|as_q)=',\r
+'images_google_com_ar','(p|q|as_p|as_q)=',\r
+'google_com_ar','(p|q|as_p|as_q)=',\r
+'www_google_com_bd','(p|q|as_p|as_q)=',\r
+'images_google_com_bd','(p|q|as_p|as_q)=',\r
+'google_com_bd','(p|q|as_p|as_q)=',\r
+'www_google_com_bh','(p|q|as_p|as_q)=',\r
+'images_google_com_bh','(p|q|as_p|as_q)=',\r
+'google_com_bh','(p|q|as_p|as_q)=',\r
+'www_google_com_bn','(p|q|as_p|as_q)=',\r
+'images_google_com_bn','(p|q|as_p|as_q)=',\r
+'google_com_bn','(p|q|as_p|as_q)=',\r
+'www_google_com_bo','(p|q|as_p|as_q)=',\r
+'images_google_com_bo','(p|q|as_p|as_q)=',\r
+'google_com_bo','(p|q|as_p|as_q)=',\r
+'www_google_com_br','(p|q|as_p|as_q)=',\r
+'images_google_com_br','(p|q|as_p|as_q)=',\r
+'google_com_br','(p|q|as_p|as_q)=',\r
+'www_google_com_bz','(p|q|as_p|as_q)=',\r
+'images_google_com_bz','(p|q|as_p|as_q)=',\r
+'google_com_bz','(p|q|as_p|as_q)=',\r
+'www_google_com_co','(p|q|as_p|as_q)=',\r
+'images_google_com_co','(p|q|as_p|as_q)=',\r
+'google_com_co','(p|q|as_p|as_q)=',\r
+'www_google_com_cu','(p|q|as_p|as_q)=',\r
+'images_google_com_cu','(p|q|as_p|as_q)=',\r
+'google_com_cu','(p|q|as_p|as_q)=',\r
+'www_google_com_cy','(p|q|as_p|as_q)=',\r
+'images_google_com_cy','(p|q|as_p|as_q)=',\r
+'google_com_cy','(p|q|as_p|as_q)=',\r
+'www_google_com_do','(p|q|as_p|as_q)=',\r
+'images_google_com_do','(p|q|as_p|as_q)=',\r
+'google_com_do','(p|q|as_p|as_q)=',\r
+'www_google_com_ec','(p|q|as_p|as_q)=',\r
+'images_google_com_ec','(p|q|as_p|as_q)=',\r
+'google_com_ec','(p|q|as_p|as_q)=',\r
+'www_google_com_eg','(p|q|as_p|as_q)=',\r
+'images_google_com_eg','(p|q|as_p|as_q)=',\r
+'google_com_eg','(p|q|as_p|as_q)=',\r
+'www_google_com_et','(p|q|as_p|as_q)=',\r
+'images_google_com_et','(p|q|as_p|as_q)=',\r
+'google_com_et','(p|q|as_p|as_q)=',\r
+'www_google_com_fj','(p|q|as_p|as_q)=',\r
+'images_google_com_fj','(p|q|as_p|as_q)=',\r
+'google_com_fj','(p|q|as_p|as_q)=',\r
+'www_google_com_gh','(p|q|as_p|as_q)=',\r
+'images_google_com_gh','(p|q|as_p|as_q)=',\r
+'google_com_gh','(p|q|as_p|as_q)=',\r
+'www_google_com_gi','(p|q|as_p|as_q)=',\r
+'images_google_com_gi','(p|q|as_p|as_q)=',\r
+'google_com_gi','(p|q|as_p|as_q)=',\r
+'www_google_com_gt','(p|q|as_p|as_q)=',\r
+'images_google_com_gt','(p|q|as_p|as_q)=',\r
+'google_com_gt','(p|q|as_p|as_q)=',\r
+'www_google_com_hk','(p|q|as_p|as_q)=',\r
+'images_google_com_hk','(p|q|as_p|as_q)=',\r
+'google_com_hk','(p|q|as_p|as_q)=',\r
+'www_google_com_jm','(p|q|as_p|as_q)=',\r
+'images_google_com_jm','(p|q|as_p|as_q)=',\r
+'google_com_jm','(p|q|as_p|as_q)=',\r
+'www_google_com_kh','(p|q|as_p|as_q)=',\r
+'images_google_com_kh','(p|q|as_p|as_q)=',\r
+'google_com_kh','(p|q|as_p|as_q)=',\r
+'www_google_com_kw','(p|q|as_p|as_q)=',\r
+'images_google_com_kw','(p|q|as_p|as_q)=',\r
+'google_com_kw','(p|q|as_p|as_q)=',\r
+'www_google_com_lb','(p|q|as_p|as_q)=',\r
+'images_google_com_lb','(p|q|as_p|as_q)=',\r
+'google_com_lb','(p|q|as_p|as_q)=',\r
+'www_google_com_lc','(p|q|as_p|as_q)=',\r
+'images_google_com_lc','(p|q|as_p|as_q)=',\r
+'google_com_lc','(p|q|as_p|as_q)=',\r
+'www_google_com_ly','(p|q|as_p|as_q)=',\r
+'images_google_com_ly','(p|q|as_p|as_q)=',\r
+'google_com_ly','(p|q|as_p|as_q)=',\r
+'www_google_com_mm','(p|q|as_p|as_q)=',\r
+'images_google_com_mm','(p|q|as_p|as_q)=',\r
+'google_com_mm','(p|q|as_p|as_q)=',\r
+'www_google_com_mt','(p|q|as_p|as_q)=',\r
+'images_google_com_mt','(p|q|as_p|as_q)=',\r
+'google_com_mt','(p|q|as_p|as_q)=',\r
+'www_google_com_mx','(p|q|as_p|as_q)=',\r
+'images_google_com_mx','(p|q|as_p|as_q)=',\r
+'google_com_mx','(p|q|as_p|as_q)=',\r
+'www_google_com_my','(p|q|as_p|as_q)=',\r
+'images_google_com_my','(p|q|as_p|as_q)=',\r
+'google_com_my','(p|q|as_p|as_q)=',\r
+'www_google_com_na','(p|q|as_p|as_q)=',\r
+'images_google_com_na','(p|q|as_p|as_q)=',\r
+'google_com_na','(p|q|as_p|as_q)=',\r
+'www_google_com_nf','(p|q|as_p|as_q)=',\r
+'images_google_com_nf','(p|q|as_p|as_q)=',\r
+'google_com_nf','(p|q|as_p|as_q)=',\r
+'www_google_com_ng','(p|q|as_p|as_q)=',\r
+'images_google_com_ng','(p|q|as_p|as_q)=',\r
+'google_com_ng','(p|q|as_p|as_q)=',\r
+'www_google_com_ni','(p|q|as_p|as_q)=',\r
+'images_google_com_ni','(p|q|as_p|as_q)=',\r
+'google_com_ni','(p|q|as_p|as_q)=',\r
+'www_google_com_np','(p|q|as_p|as_q)=',\r
+'images_google_com_np','(p|q|as_p|as_q)=',\r
+'google_com_np','(p|q|as_p|as_q)=',\r
+'www_google_com_om','(p|q|as_p|as_q)=',\r
+'images_google_com_om','(p|q|as_p|as_q)=',\r
+'google_com_om','(p|q|as_p|as_q)=',\r
+'www_google_com_pa','(p|q|as_p|as_q)=',\r
+'images_google_com_pa','(p|q|as_p|as_q)=',\r
+'google_com_pa','(p|q|as_p|as_q)=',\r
+'www_google_com_pe','(p|q|as_p|as_q)=',\r
+'images_google_com_pe','(p|q|as_p|as_q)=',\r
+'google_com_pe','(p|q|as_p|as_q)=',\r
+'www_google_com_pg','(p|q|as_p|as_q)=',\r
+'images_google_com_pg','(p|q|as_p|as_q)=',\r
+'google_com_pg','(p|q|as_p|as_q)=',\r
+'www_google_com_ph','(p|q|as_p|as_q)=',\r
+'images_google_com_ph','(p|q|as_p|as_q)=',\r
+'google_com_ph','(p|q|as_p|as_q)=',\r
+'www_google_com_pk','(p|q|as_p|as_q)=',\r
+'images_google_com_pk','(p|q|as_p|as_q)=',\r
+'google_com_pk','(p|q|as_p|as_q)=',\r
+'www_google_com_pr','(p|q|as_p|as_q)=',\r
+'images_google_com_pr','(p|q|as_p|as_q)=',\r
+'google_com_pr','(p|q|as_p|as_q)=',\r
+'www_google_com_py','(p|q|as_p|as_q)=',\r
+'images_google_com_py','(p|q|as_p|as_q)=',\r
+'google_com_py','(p|q|as_p|as_q)=',\r
+'www_google_com_qa','(p|q|as_p|as_q)=',\r
+'images_google_com_qa','(p|q|as_p|as_q)=',\r
+'google_com_qa','(p|q|as_p|as_q)=',\r
+'www_google_com_sa','(p|q|as_p|as_q)=',\r
+'images_google_com_sa','(p|q|as_p|as_q)=',\r
+'google_com_sa','(p|q|as_p|as_q)=',\r
+'www_google_com_sb','(p|q|as_p|as_q)=',\r
+'images_google_com_sb','(p|q|as_p|as_q)=',\r
+'google_com_sb','(p|q|as_p|as_q)=',\r
+'www_google_com_sg','(p|q|as_p|as_q)=',\r
+'images_google_com_sg','(p|q|as_p|as_q)=',\r
+'google_com_sg','(p|q|as_p|as_q)=',\r
+'www_google_com_sl','(p|q|as_p|as_q)=',\r
+'images_google_com_sl','(p|q|as_p|as_q)=',\r
+'google_com_sl','(p|q|as_p|as_q)=',\r
+'www_google_com_sv','(p|q|as_p|as_q)=',\r
+'images_google_com_sv','(p|q|as_p|as_q)=',\r
+'google_com_sv','(p|q|as_p|as_q)=',\r
+'www_google_com_tj','(p|q|as_p|as_q)=',\r
+'images_google_com_tj','(p|q|as_p|as_q)=',\r
+'google_com_tj','(p|q|as_p|as_q)=',\r
+'www_google_com_tw','(p|q|as_p|as_q)=',\r
+'images_google_com_tw','(p|q|as_p|as_q)=',\r
+'google_com_tw','(p|q|as_p|as_q)=',\r
+'www_google_com_ua','(p|q|as_p|as_q)=',\r
+'images_google_com_ua','(p|q|as_p|as_q)=',\r
+'google_com_ua','(p|q|as_p|as_q)=',\r
+'www_google_com_uy','(p|q|as_p|as_q)=',\r
+'images_google_com_uy','(p|q|as_p|as_q)=',\r
+'google_com_uy','(p|q|as_p|as_q)=',\r
+'www_google_com_vc','(p|q|as_p|as_q)=',\r
+'images_google_com_vc','(p|q|as_p|as_q)=',\r
+'google_com_vc','(p|q|as_p|as_q)=',\r
+'www_google_com_vn','(p|q|as_p|as_q)=',\r
+'images_google_com_vn','(p|q|as_p|as_q)=',\r
+'google_com_vn','(p|q|as_p|as_q)=',\r
+'www_google_cv','(p|q|as_p|as_q)=',\r
+'images_google_cv','(p|q|as_p|as_q)=',\r
+'google_cv','(p|q|as_p|as_q)=',\r
+'www_google_cz','(p|q|as_p|as_q)=',\r
+'images_google_cz','(p|q|as_p|as_q)=',\r
+'google_cz','(p|q|as_p|as_q)=',\r
+'www_google_dj','(p|q|as_p|as_q)=',\r
+'images_google_dj','(p|q|as_p|as_q)=',\r
+'google_dj','(p|q|as_p|as_q)=',\r
+'www_google_dk','(p|q|as_p|as_q)=',\r
+'images_google_dk','(p|q|as_p|as_q)=',\r
+'google_dk','(p|q|as_p|as_q)=',\r
+'www_google_dm','(p|q|as_p|as_q)=',\r
+'images_google_dm','(p|q|as_p|as_q)=',\r
+'google_dm','(p|q|as_p|as_q)=',\r
+'www_google_dz','(p|q|as_p|as_q)=',\r
+'images_google_dz','(p|q|as_p|as_q)=',\r
+'google_dz','(p|q|as_p|as_q)=',\r
+'www_google_ee','(p|q|as_p|as_q)=',\r
+'images_google_ee','(p|q|as_p|as_q)=',\r
+'google_ee','(p|q|as_p|as_q)=',\r
+'www_google_fi','(p|q|as_p|as_q)=',\r
+'images_google_fi','(p|q|as_p|as_q)=',\r
+'google_fi','(p|q|as_p|as_q)=',\r
+'www_google_fm','(p|q|as_p|as_q)=',\r
+'images_google_fm','(p|q|as_p|as_q)=',\r
+'google_fm','(p|q|as_p|as_q)=',\r
+'www_google_ga','(p|q|as_p|as_q)=',\r
+'images_google_ga','(p|q|as_p|as_q)=',\r
+'google_ga','(p|q|as_p|as_q)=',\r
+'www_google_ge','(p|q|as_p|as_q)=',\r
+'images_google_ge','(p|q|as_p|as_q)=',\r
+'google_ge','(p|q|as_p|as_q)=',\r
+'www_google_gf','(p|q|as_p|as_q)=',\r
+'images_google_gf','(p|q|as_p|as_q)=',\r
+'google_gf','(p|q|as_p|as_q)=',\r
+'www_google_gg','(p|q|as_p|as_q)=',\r
+'images_google_gg','(p|q|as_p|as_q)=',\r
+'google_gg','(p|q|as_p|as_q)=',\r
+'www_google_gl','(p|q|as_p|as_q)=',\r
+'images_google_gl','(p|q|as_p|as_q)=',\r
+'google_gl','(p|q|as_p|as_q)=',\r
+'www_google_gm','(p|q|as_p|as_q)=',\r
+'images_google_gm','(p|q|as_p|as_q)=',\r
+'google_gm','(p|q|as_p|as_q)=',\r
+'www_google_gp','(p|q|as_p|as_q)=',\r
+'images_google_gp','(p|q|as_p|as_q)=',\r
+'google_gp','(p|q|as_p|as_q)=',\r
+'www_google_gy','(p|q|as_p|as_q)=',\r
+'images_google_gy','(p|q|as_p|as_q)=',\r
+'google_gy','(p|q|as_p|as_q)=',\r
+'www_google_hn','(p|q|as_p|as_q)=',\r
+'images_google_hn','(p|q|as_p|as_q)=',\r
+'google_hn','(p|q|as_p|as_q)=',\r
+'www_google_ht','(p|q|as_p|as_q)=',\r
+'images_google_ht','(p|q|as_p|as_q)=',\r
+'google_ht','(p|q|as_p|as_q)=',\r
+'www_google_hu','(p|q|as_p|as_q)=',\r
+'images_google_hu','(p|q|as_p|as_q)=',\r
+'google_hu','(p|q|as_p|as_q)=',\r
+'www_google_im','(p|q|as_p|as_q)=',\r
+'images_google_im','(p|q|as_p|as_q)=',\r
+'google_im','(p|q|as_p|as_q)=',\r
+'www_google_io','(p|q|as_p|as_q)=',\r
+'images_google_io','(p|q|as_p|as_q)=',\r
+'google_io','(p|q|as_p|as_q)=',\r
+'www_google_iq','(p|q|as_p|as_q)=',\r
+'images_google_iq','(p|q|as_p|as_q)=',\r
+'google_iq','(p|q|as_p|as_q)=',\r
+'www_google_is','(p|q|as_p|as_q)=',\r
+'images_google_is','(p|q|as_p|as_q)=',\r
+'google_is','(p|q|as_p|as_q)=',\r
+'www_google_je','(p|q|as_p|as_q)=',\r
+'images_google_je','(p|q|as_p|as_q)=',\r
+'google_je','(p|q|as_p|as_q)=',\r
+'www_google_jo','(p|q|as_p|as_q)=',\r
+'images_google_jo','(p|q|as_p|as_q)=',\r
+'google_jo','(p|q|as_p|as_q)=',\r
+'www_google_kg','(p|q|as_p|as_q)=',\r
+'images_google_kg','(p|q|as_p|as_q)=',\r
+'google_kg','(p|q|as_p|as_q)=',\r
+'www_google_ki','(p|q|as_p|as_q)=',\r
+'images_google_ki','(p|q|as_p|as_q)=',\r
+'google_ki','(p|q|as_p|as_q)=',\r
+'www_google_kz','(p|q|as_p|as_q)=',\r
+'images_google_kz','(p|q|as_p|as_q)=',\r
+'google_kz','(p|q|as_p|as_q)=',\r
+'www_google_la','(p|q|as_p|as_q)=',\r
+'images_google_la','(p|q|as_p|as_q)=',\r
+'google_la','(p|q|as_p|as_q)=',\r
+'www_google_li','(p|q|as_p|as_q)=',\r
+'images_google_li','(p|q|as_p|as_q)=',\r
+'google_li','(p|q|as_p|as_q)=',\r
+'www_google_lk','(p|q|as_p|as_q)=',\r
+'images_google_lk','(p|q|as_p|as_q)=',\r
+'google_lk','(p|q|as_p|as_q)=',\r
+'www_google_lt','(p|q|as_p|as_q)=',\r
+'images_google_lt','(p|q|as_p|as_q)=',\r
+'google_lt','(p|q|as_p|as_q)=',\r
+'www_google_lu','(p|q|as_p|as_q)=',\r
+'images_google_lu','(p|q|as_p|as_q)=',\r
+'google_lu','(p|q|as_p|as_q)=',\r
+'www_google_lv','(p|q|as_p|as_q)=',\r
+'images_google_lv','(p|q|as_p|as_q)=',\r
+'google_lv','(p|q|as_p|as_q)=',\r
+'www_google_md','(p|q|as_p|as_q)=',\r
+'images_google_md','(p|q|as_p|as_q)=',\r
+'google_md','(p|q|as_p|as_q)=',\r
+'www_google_me','(p|q|as_p|as_q)=',\r
+'images_google_me','(p|q|as_p|as_q)=',\r
+'google_me','(p|q|as_p|as_q)=',\r
+'www_google_mg','(p|q|as_p|as_q)=',\r
+'images_google_mg','(p|q|as_p|as_q)=',\r
+'google_mg','(p|q|as_p|as_q)=',\r
+'www_google_mk','(p|q|as_p|as_q)=',\r
+'images_google_mk','(p|q|as_p|as_q)=',\r
+'google_mk','(p|q|as_p|as_q)=',\r
+'www_google_ml','(p|q|as_p|as_q)=',\r
+'images_google_ml','(p|q|as_p|as_q)=',\r
+'google_ml','(p|q|as_p|as_q)=',\r
+'www_google_mn','(p|q|as_p|as_q)=',\r
+'images_google_mn','(p|q|as_p|as_q)=',\r
+'google_mn','(p|q|as_p|as_q)=',\r
+'www_google_ms','(p|q|as_p|as_q)=',\r
+'images_google_ms','(p|q|as_p|as_q)=',\r
+'google_ms','(p|q|as_p|as_q)=',\r
+'www_google_mu','(p|q|as_p|as_q)=',\r
+'images_google_mu','(p|q|as_p|as_q)=',\r
+'google_mu','(p|q|as_p|as_q)=',\r
+'www_google_mv','(p|q|as_p|as_q)=',\r
+'images_google_mv','(p|q|as_p|as_q)=',\r
+'google_mv','(p|q|as_p|as_q)=',\r
+'www_google_mw','(p|q|as_p|as_q)=',\r
+'images_google_mw','(p|q|as_p|as_q)=',\r
+'google_mw','(p|q|as_p|as_q)=',\r
+'www_google_ne','(p|q|as_p|as_q)=',\r
+'images_google_ne','(p|q|as_p|as_q)=',\r
+'google_ne','(p|q|as_p|as_q)=',\r
+'www_google_nr','(p|q|as_p|as_q)=',\r
+'images_google_nr','(p|q|as_p|as_q)=',\r
+'google_nr','(p|q|as_p|as_q)=',\r
+'www_google_nu','(p|q|as_p|as_q)=',\r
+'images_google_nu','(p|q|as_p|as_q)=',\r
+'google_nu','(p|q|as_p|as_q)=',\r
+'www_google_pn','(p|q|as_p|as_q)=',\r
+'images_google_pn','(p|q|as_p|as_q)=',\r
+'google_pn','(p|q|as_p|as_q)=',\r
+'www_google_ps','(p|q|as_p|as_q)=',\r
+'images_google_ps','(p|q|as_p|as_q)=',\r
+'google_ps','(p|q|as_p|as_q)=',\r
+'www_google_ro','(p|q|as_p|as_q)=',\r
+'images_google_ro','(p|q|as_p|as_q)=',\r
+'google_ro','(p|q|as_p|as_q)=',\r
+'www_google_rs','(p|q|as_p|as_q)=',\r
+'images_google_rs','(p|q|as_p|as_q)=',\r
+'google_rs','(p|q|as_p|as_q)=',\r
+'www_google_ru','(p|q|as_p|as_q)=',\r
+'images_google_ru','(p|q|as_p|as_q)=',\r
+'google_ru','(p|q|as_p|as_q)=',\r
+'www_google_rw','(p|q|as_p|as_q)=',\r
+'images_google_rw','(p|q|as_p|as_q)=',\r
+'google_rw','(p|q|as_p|as_q)=',\r
+'www_google_sc','(p|q|as_p|as_q)=',\r
+'images_google_sc','(p|q|as_p|as_q)=',\r
+'google_sc','(p|q|as_p|as_q)=',\r
+'www_google_sh','(p|q|as_p|as_q)=',\r
+'images_google_sh','(p|q|as_p|as_q)=',\r
+'google_sh','(p|q|as_p|as_q)=',\r
+'www_google_si','(p|q|as_p|as_q)=',\r
+'images_google_si','(p|q|as_p|as_q)=',\r
+'google_si','(p|q|as_p|as_q)=',\r
+'www_google_sk','(p|q|as_p|as_q)=',\r
+'images_google_sk','(p|q|as_p|as_q)=',\r
+'google_sk','(p|q|as_p|as_q)=',\r
+'www_google_sm','(p|q|as_p|as_q)=',\r
+'images_google_sm','(p|q|as_p|as_q)=',\r
+'google_sm','(p|q|as_p|as_q)=',\r
+'www_google_sn','(p|q|as_p|as_q)=',\r
+'images_google_sn','(p|q|as_p|as_q)=',\r
+'google_sn','(p|q|as_p|as_q)=',\r
+'www_google_so','(p|q|as_p|as_q)=',\r
+'images_google_so','(p|q|as_p|as_q)=',\r
+'google_so','(p|q|as_p|as_q)=',\r
+'www_google_sr','(p|q|as_p|as_q)=',\r
+'images_google_sr','(p|q|as_p|as_q)=',\r
+'google_sr','(p|q|as_p|as_q)=',\r
+'www_google_st','(p|q|as_p|as_q)=',\r
+'images_google_st','(p|q|as_p|as_q)=',\r
+'google_st','(p|q|as_p|as_q)=',\r
+'www_google_td','(p|q|as_p|as_q)=',\r
+'images_google_td','(p|q|as_p|as_q)=',\r
+'google_td','(p|q|as_p|as_q)=',\r
+'www_google_tg','(p|q|as_p|as_q)=',\r
+'images_google_tg','(p|q|as_p|as_q)=',\r
+'google_tg','(p|q|as_p|as_q)=',\r
+'www_google_tk','(p|q|as_p|as_q)=',\r
+'images_google_tk','(p|q|as_p|as_q)=',\r
+'google_tk','(p|q|as_p|as_q)=',\r
+'www_google_tl','(p|q|as_p|as_q)=',\r
+'images_google_tl','(p|q|as_p|as_q)=',\r
+'google_tl','(p|q|as_p|as_q)=',\r
+'www_google_tm','(p|q|as_p|as_q)=',\r
+'images_google_tm','(p|q|as_p|as_q)=',\r
+'google_tm','(p|q|as_p|as_q)=',\r
+'www_google_tn','(p|q|as_p|as_q)=',\r
+'images_google_tn','(p|q|as_p|as_q)=',\r
+'google_tn','(p|q|as_p|as_q)=',\r
+'www_google_to','(p|q|as_p|as_q)=',\r
+'images_google_to','(p|q|as_p|as_q)=',\r
+'google_to','(p|q|as_p|as_q)=',\r
+'www_google_tt','(p|q|as_p|as_q)=',\r
+'images_google_tt','(p|q|as_p|as_q)=',\r
+'google_tt','(p|q|as_p|as_q)=',\r
+'www_google_us','(p|q|as_p|as_q)=',\r
+'images_google_us','(p|q|as_p|as_q)=',\r
+'google_us','(p|q|as_p|as_q)=',\r
+'www_google_vg','(p|q|as_p|as_q)=',\r
+'images_google_vg','(p|q|as_p|as_q)=',\r
+'google_vg','(p|q|as_p|as_q)=',\r
+'www_google_vu','(p|q|as_p|as_q)=',\r
+'images_google_vu','(p|q|as_p|as_q)=',\r
+'google_vu','(p|q|as_p|as_q)=',\r
+'www_google_ws','(p|q|as_p|as_q)=',\r
+'images_google_ws','(p|q|as_p|as_q)=',\r
+'google_ws','(p|q|as_p|as_q)=',\r
+\r
+'google_base','(q|p|as_p|as_q)=',\r
+'google_translate','q=',\r
+'googleByIP','googleByIP','q=',\r
+'google_catchall','(q|p|as_p|as_q)=',\r
+'google_cache','(p|q|as_p|as_q)=cache:[0-9A-Za-z]{12}:',\r
+'google_froogle','(q|p|as_p|as_q)=',\r
+'google_groups','group\/', # does not work\r
+'google_maps','(dq|q|p|as_p|as_q)=',\r
+'google_products','(q|p|as_p|as_q)=',\r
+'google4counter','(q|p|as_p|as_q)=',\r
+\r
+'1klik','query=',\r
+'1search','query=',\r
+'1und1_de','q=',\r
+'3721','(p|name)=',\r
+'a9','a9\.com\/', \r
+'abacho','q=',\r
+'accoona','qt=',\r
+'alexa','q=',\r
+'aliceit','qs=',\r
+'aliceitmaster','qs=',\r
+'allesklar','q=',\r
+'allgameshome','s=',\r
+'alltheweb','q(|uery)=',\r
+'alot','q=',\r
+'altavista','p=',\r
+'amazon','query=',\r
+'androidsearch','q=',\r
+'answerbus','',\r
+'anzwers','search=',\r
+'aol_o2suche_de','q(|uery)=',\r
+'aolcatchall','q(|query)=',\r
+'aolcom','q(|query)=',\r
+'aolde','q(|query)=',\r
+'aolfr','q(|uery)=',\r
+'aolpl','q(|query)=',\r
+'aolsearchde','q(|query)=',\r
+'aoluk','q(|query)=',\r
+'aport','r=',\r
+'arianna','query=',\r
+'asevenboard','query=',\r
+'askcatchall','q=',\r
+'askde','q=',\r
+'askes','q=',\r
+'askfr','q=',\r
+'askimages','q=',\r
+'askit','q=',\r
+'askjp','q=',\r
+'asknl','q=',\r
+'askuk','q=',\r
+'atlanticbb','q=',\r
+'atlas','(searchtext|q)=', \r
+'atomz','sp-q=',\r
+'att','qry=',\r
+'au_search_yahoo_com','p=',\r
+'auone','q=',\r
+'avantfind','keywords=',\r
+'avg','q=',\r
+'babylon','q=',\r
+'baidu','(word|wd)=',\r
+'bbc','q=', \r
+'benefind','q=',\r
+'biglotron','question=',\r
+'bing','q(|pvt)=',\r
+'blekko','q=',\r
+'blingo','q=',\r
+'bluewin', 'qry=',\r
+'bt','p=',\r
+'bungeebonesdotcom','query=',\r
+'ca_search_yahoo_com','p=',\r
+'centraldatabase','query=',\r
+'centrum','q=', \r
+'centurylink','q=',\r
+'certifiedtoolbarsearch','q=',\r
+'charter','q=',\r
+'chatzum','q=',\r
+'checkparams','q=',\r
+'chelloat','q1=',\r
+'chellobe','q1=',\r
+'chellocom','q1=',\r
+'chellocz','q1=',\r
+'chellofr','q1=',\r
+'chellohu','q1=',\r
+'chellonl','q1=',\r
+'chellono','q1=',\r
+'chellopl','q1=',\r
+'chellose','q1=',\r
+'chellosk','q1=',\r
+'clarosearch','q=',\r
+'clinck','q=',\r
+'clubinternet', 'q=',\r
+'clusty','query=',\r
+'comcast','q=',\r
+'comettoolbar','qry=',\r
+'conduit','q=',\r
+'copernic','web\/',\r
+'crawler','q=',\r
+'ctrouve','q=',\r
+'dalesearch','q=',\r
+'danielsen','q=', \r
+'daum','q=',\r
+'de_dolphin_com','q=',\r
+'de_wiki_gov_cn','de\.wiki\.gov\.cn\/s_',\r
+'dejanews','q=',\r
+'delicious','all=',\r
+'delta-search','q=',\r
+'digg','s=',\r
+'dmoz','search=',\r
+'dodajpl','keyword=',\r
+'dogpile', '(q=|kw=|web/)',\r
+'duckduckgo','nokey=',\r
+'earthlink', 'q=',\r
+'easysearch','s=',\r
+'ecosia','q=',\r
+'edderkoppen','query=', \r
+'engine','p1=', \r
+'eniro','q=',\r
+'enirose','q=',\r
+'ereadingsource','q=',\r
+'etools_ch','query=',\r
+'euroseek','query=',\r
+'everyclick','keyword=',\r
+'excite','search=',\r
+'facemoods','(q|s)=',\r
+'fastbot_de','red=[0-9]*\+',\r
+'fbdownloader','q=',\r
+'fdownloadr_com','q=',\r
+'find1friend','q=',\r
+'findamo','q=',\r
+'findarticles','key=',\r
+'finddk','words=', \r
+'fireball','q=', \r
+'flipora','q=',\r
+'foxstart','q=',\r
+'fr_search_yahoo_com','p=',\r
+'francite','name=', \r
+'free','q=',\r
+'freenet_de','query=',\r
+'freeserve','q=',\r
+'funmoods','(q|s)=',\r
+'gazetapl','slowo=',\r
+'genieo','q=',\r
+'gerypl','q=',\r
+'globososo','q=',\r
+'gmxsuche','q=',\r
+'gmxsuche_at','q=',\r
+'go','qt=',\r
+'go.mail.ru','q=',\r
+'go2net','general=',\r
+'godado','Keywords=',\r
+'goliat','KERESES=',\r
+'goodsearch','Keywords=',\r
+'gotuneed','', # Not yet known\r
+'govome','q=',\r
+'haku','w=',\r
+'handycafe','q=',\r
+'heureka','heureka=', \r
+'hogapl','qt=',\r
+'holasearch','q=',\r
+'hotbot','mt=',\r
+'hp_my_aol','q(|uery)=',\r
+'hubwe','p=',\r
+'iask','(w|k)=',\r
+'iboats','highlight=',\r
+'icerocket','q=',\r
+'ichiro','MT=',\r
+'icq','q=',\r
+'ilse','search_for=', \r
+'image_search_yahoo_co_jp','p=',\r
+'images_search_yahoo_com','p=',\r
+'iminent','q=',\r
+'inbox','q=',\r
+'incredibar','q=',\r
+'incredimail','q=',\r
+'indexhu','q=', \r
+'ineffabile','',\r
+'infoseek','qt=',\r
+'infospace','qkw=',\r
+'infouk','qkw=',\r
+'inspsearch','q=',\r
+'int_search_myway_com','searchfor=',\r
+'interiapl','q=',\r
+'internetto','searchstr=',\r
+'isearch_nation_com','q=',\r
+'it_search_yahoo_com','p=',\r
+'iune','(keywords|q)=',\r
+'ixquick', 'query=',\r
+'izito_catchall','(query|OVKEY|q)=',\r
+'izito_de','(query|OVKEY|q)=',\r
+'izito_uk','(query|OVKEY|q)=',\r
+'jubii','soegeord=', \r
+'jumpyit','searchWord=',\r
+'juno','query=',\r
+'jyxo','(s|q)=', \r
+'kartoo','',\r
+'katalogonetpl','qt=',\r
+'kataweb','q=',\r
+'keresolap_hu','q=',\r
+'kvasir', 'q=',\r
+'kvitters','query=',\r
+'lapkereso_hu','q=',\r
+'lbb','q=', \r
+'ledix','q=',\r
+'libero','qs=',\r
+'libertysurf','q=',\r
+'live','q=',\r
+'localmoxie','keyword=',\r
+'looksmart_catchall','key=',\r
+'looksmart_co_uk','key=',\r
+'lycos','query=',\r
+'mamma','query=',\r
+'meinestadt','q=',\r
+'metabot','st=',\r
+'metacrawler','general=',\r
+'metacrawler_de','qry=',\r
+'metager','eingabe=',\r
+'metahannover','q=',\r
+'metasearch','q=',\r
+'metaspinner','qry=',\r
+'metasuche_ch','q=',\r
+'metaua','q=',\r
+'miner','q=',\r
+'mirago','(txtsearch|qry)=',\r
+'miragobe','(txtsearch|qry)=',\r
+'miragoch','(txtsearch|qry)=',\r
+'miragocouk','(txtsearch|qry)=',\r
+'miragode','(txtsearch|qry)=',\r
+'miragodk','(txtsearch|qry)=',\r
+'miragoes','(txtsearch|qry)=',\r
+'miragofr','(txtsearch|qry)=',\r
+'miragoit','(txtsearch|qry)=',\r
+'miragonl','(txtsearch|qry)=',\r
+'miragono','(txtsearch|qry)=',\r
+'miragose','(txtsearch|qry)=',\r
+'mitrasites','q=',\r
+'mozbot','q=',\r
+'msn','q=',\r
+'mys_yoursearch_me','q=',\r
+'mysearch','searchfor=',\r
+'mysearchdial','q=',\r
+'mysearchresults','q=',\r
+'myway','searchfor=',\r
+'mywebsearch','searchfor=',\r
+'najdi','dotaz=',\r
+'nation','q=',\r
+'navigationshilfe_t_online','q=',\r
+'nbci','keyword=',\r
+'netease','q=',\r
+'netluchs','query=',\r
+'netscape','search=',\r
+'netsprintpl','q=',\r
+'netstjernen','q=',\r
+'netzero','query=',\r
+'no query string available',\r
+'northernlight','qr=',\r
+'nortonsavesearch','q=',\r
+'nusearch','nusearch_terms=',\r
+'o2pl','qt=',\r
+'ofir','querytext=',\r
+'oneseek_de','q=',\r
+'onetpl','qt=',\r
+'opasia','q=', \r
+'orange','q=',\r
+'orangeworld','q=',\r
+'orbis','search_field=',\r
+'origo','(q|search)=', \r
+'overture','keywords=',\r
+'passagen','q=',\r
+'pch','q=',\r
+'peoplecheck_de','q=',\r
+'ph_search_yahoo_com','p=',\r
+'picsearch','q=',\r
+'pictures','q=',\r
+'plusnetwork','q=',\r
+'pogodak','q=',\r
+'polskapl','qt=',\r
+'polymeta_hu','',\r
+'preciobarato_xyz','s=',\r
+'questionanswering','',\r
+'quick','query=', \r
+'qwant_com','q=',\r
+'r_search_yahoo_com','p=',\r
+'rakuten','qt=',\r
+'rambler','words=',\r
+'redbox','srch=',\r
+'rr','q=',\r
+'safehomepage_com','q=',\r
+'sagool','q=',\r
+'sapo','q=',\r
+'schoenerbrausen','q=',\r
+'scroogle','Gw=',\r
+'se_search_yahoo_com','p=',\r
+'search.com','q=',\r
+'search_1und1_de','q=',\r
+'search_foxtab_com','q=',\r
+'search_socialdownloadr_com','q=',\r
+'search_yahoo_co_jp','p=',\r
+'search_yahoo_com','p=',\r
+'search_zonealarm_com','q=',\r
+'searchalgo','q=',\r
+'searchalot','q=',\r
+'searchch', 'q=',\r
+'searchcompletion','q=',\r
+'searches_qone8_com','q=',\r
+'searchesnavigator','query=',\r
+'searchfunmoods','q=',\r
+'searchgol','q=',\r
+'searchlistingsite','keyword=',\r
+'searchmobileonline','q=',\r
+'searchresults','q=',\r
+'search-results_mobi','q=',\r
+'searchresultscom','q=',\r
+'searchresultsmobi','q=',\r
+'searchsafer','q=',\r
+'searchy', 'search_term=',\r
+'searchya','q=',\r
+'segnalo','',\r
+'semalt','u=',\r
+'sensis','find=',\r
+'seznam','(w|q)=', \r
+'sg_search_yahoo_com','p=',\r
+'sg_yhs4_search_yahoo_com','p=',\r
+'shawca','q=',\r
+'shinyseek\.it','KEY=',\r
+'shoppstop','keywords=',\r
+'sify','keyword=',\r
+'sky','term=',\r
+'smartsuggestor','s=',\r
+'smde','q=',\r
+'snapdo','q=',\r
+'softonic','q=',\r
+'sogou', 'query=',\r
+'sol','q=', \r
+'soso','q=',\r
+'speedbit','q=',\r
+'sphere','q=',\r
+'splut','pattern=', \r
+'spotjockey','Search_Keyword=', \r
+'spray','string=',\r
+'start','q=',\r
+'startlap_hu','q=',\r
+'startpage','query=', \r
+'startsiden','q=',\r
+'startxxl','q=',\r
+'steadysearch','w=',\r
+'stumbleupon','',\r
+'sucheaolde','q(|query)=',\r
+'supereva','q=',\r
+'surfcanyon_com','q=',\r
+'sweetim','q=',\r
+'sweetpacks','q=',\r
+'swik','swik\.net/',\r
+'swisscows_ch','query=',\r
+'sympatico', 'query=', \r
+'szukaczpl','q=',\r
+'t_online_catchall','q=',\r
+'t_online_de','q=',\r
+'talktalk_uk', 'query=',\r
+'tango_hu','q=',\r
+'tbask','searchfor=',\r
+'teecnoit','q=',\r
+'teoma','q=',\r
+'terra','query=',\r
+'tesco','q=',\r
+'theallsearches','query=',\r
+'three','q=',\r
+'tiscali','key=',\r
+'tixuma_de','sc=',\r
+'toile', 'q=',\r
+'toshiba','q=',\r
+'turtle','q=',\r
+'tw_images_search_yahoo_com','p=',\r
+'tyfon','q=',\r
+'uk_foxstart_com','q=',\r
+'uk_search_yahoo_com','p=',\r
+'uk_yhs4_search_yahoo_com','p=',\r
+'ukdirectory','k=', \r
+'ukindex', 'stext=', \r
+'ukplus','search=', \r
+'umfis','suchbegriff=',\r
+'umuwa_de','umuwa\.de\/',\r
+'us_search_yahoo_com','p=',\r
+'vindex','in=',\r
+'virgilio','qs=',\r
+'virginmedia','q=',\r
+'vi-view_com','q=',\r
+'vivisimo','query=',\r
+'vlips_de','q=',\r
+'vnet','kw=',\r
+'voila','(kw|rdata)=',\r
+'wahoo','q=',\r
+'webalta','q=',\r
+'webcrawler','(q|searchText)=',\r
+'webde','su=',\r
+'webmania','q=',\r
+'whorush_com','q=',\r
+'windowssearch_com','q=',\r
+'wisenut','query=', \r
+'wow_utop_it','q=',\r
+'wowpl','q=',\r
+'wowsearch','q=',\r
+'wowuk','q=',\r
+'wp','szukaj=',\r
+'www_buenosearch_com','q=',\r
+'www_dregol_com','q=',\r
+'www_wow_com','q=',\r
+'wwweasel','q=',\r
+'yahoo_catchall','p=',\r
+'yahoo_mindset','p=',\r
+'yandex','text=',\r
+'yandexcom','text=',\r
+'yandexcomtr','text=',\r
+'yandexkz','text=',\r
+'yandexru','text=',\r
+'yandexua','text=',\r
+'yell','keywords=',\r
+'yourbestsearch','k=',\r
+'youtube','q=',\r
+'zapmeta_catchall','query=',\r
+'zapmeta_ch','query=',\r
+'zapmeta_com','query=',\r
+'zapmeta_de','query=',\r
+'zhongsou','(word|w)=',\r
+'zoeken','q(|uery)=',\r
+'zoznam','q='\r
+);\r
+\r
+# SearchEnginesKnownUrlNotFound\r
+# Per search engine id, the rule used to extract the "not found" keywords\r
+# from a referrer URL that comes from that search engine.\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesKnownUrlNotFound = (\r
+    # Most common search engines\r
+    'msn' => 'origq=',\r
+);\r
+\r
+# Fallback parameter lists, used for search engines that have no known rule.\r
+#------------------------------------------------------------------------------\r
+# WordsToExtractSearchUrl: used to search for the keyword parameter when no\r
+# rule is known. Every entry is listed exactly once ('qr=' used to appear\r
+# twice); the original order is otherwise unchanged.\r
+# NOTE(review): 'image keys=', 'Serbian=' and 'uery=' do not look like real\r
+# parameter names - kept as found, confirm whether they are intended.\r
+@WordsToExtractSearchUrl = (\r
+    'all=', 'as_q=', 'ask=', 'claus=', 'dotaz=', 'find=', 'general=', 'Gw=',\r
+    'heureka=', 'highlight=', 'ie=', 'image keys=', 'imgurl=', 'in=', 'iu=',\r
+    'k=', 'KERESES=', 'key=', 'keyword=', 'keywords=', 'kw=', 'mt=', 'name=',\r
+    'nusearch_terms=', 'OVKEY=', 'p=', 'p1=', 'pattern=', 'q=', 'q1=', 'qkw=',\r
+    'qpvt=', 'qr=', 'qry=', 'qs=', 'qt=', 'query=', 'querytext=', 'question=',\r
+    'r=', 'rdata=', 'req=', 's=', 'search=', 'search_field=', 'search_for=',\r
+    'Search_Keyword=', 'search_term=', 'searchfor=', 'searchstr=',\r
+    'searchtext=', 'searchWord=', 'Serbian=', 'slowo=', 'soegeord=', 'sp-q=',\r
+    'srch=', 'st=', 'stext=', 'string=', 'su=', 'szukaj=', 'term=', 'text=',\r
+    'tn=', 'txtsearch=', 'uery=', 'w=', 'wd=', 'word=', 'words=',\r
+);\r
+# WordsToCleanSearchUrl: used when no rule is known and the search in\r
+# WordsToExtractSearchUrl failed, to clean the URL of non-keyword parameters.\r
+@WordsToCleanSearchUrl = (\r
+    'act=', 'annuaire=', 'btng=', 'cat=', 'categoria=', 'cfg=', 'cof=', 'cou=',\r
+    'count=', 'cp=', 'dd=', 'domain=', 'dt=', 'dw=', 'enc=', 'exec=', 'geo=',\r
+    'hc=', 'height=', 'hits=', 'hl=', 'hq=', 'hs=', 'id=', 'kl=', 'lang=',\r
+    'loc=', 'lr=', 'matchmode=', 'medor=', 'message=', 'meta=', 'mode=',\r
+    'order=', 'page=', 'par=', 'pays=', 'pg=', 'pos=', 'prg=', 'qc=', 'refer=',\r
+    'sa=', 'safe=', 'sc=', 'sort=', 'src=', 'start=', 'style=', 'stype=',\r
+    'sum=', 'tag=', 'temp=', 'theme=', 'type=', 'url=', 'user=', 'width=',\r
+    'what=', '\\.x=', '\\.y=', 'y=', 'look=',\r
+);\r
+\r
+# SearchEnginesKnownUTFCoding\r
+# Per search engine id, the known parameter that proves the engine has coded\r
+# its parameters in UTF-8.\r
+# NOTE(review): the Google ids in the neighbouring tables are per-domain\r
+# (e.g. 'www_google_com'); confirm that a plain 'google' id is still in use.\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesKnownUTFCoding = (\r
+    # Most common search engines\r
+    'google'    => 'ie=utf-8',\r
+    'alltheweb' => 'cs=utf-8',\r
+);\r
+\r
+\r
+# SearchEnginesHashLib\r
+# List of search engine names\r
+# 'search_engine_id', 'search_engine_name',\r
+#------------------------------------------------------------------------------\r
+%SearchEnginesHashLib=(\r
+# Each value is the search engine's display name, written as an HTML link or as plain text, as the case may be\r
+\r
+'www_google_co_uk','<a href="http://www.google.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Kingdom</a>',\r
+'images_google_co_uk','<a href="http://images.google.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Kingdom ( images )</a>',\r
+'google_co_uk','<a href="http://google.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Kingdom ( catchall )</a>',\r
+'www_google_com','<a href="http://www.google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google .com</a>',\r
+'images_google_com','<a href="http://images.google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google .com ( images )</a>',\r
+'google_com','<a href="http://google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google .com ( catchall )</a>',\r
+'www_google_de','<a href="http://www.google.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Germany</a>',\r
+'images_google_de','<a href="http://images.google.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Germany ( images )</a>',\r
+'google_de','<a href="http://google.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Germany ( catchall )</a>',\r
+'www_google_fr','<a href="http://www.google.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google France</a>',\r
+'images_google_fr','<a href="http://images.google.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google France ( images )</a>',\r
+'google_fr','<a href="http://google.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google France ( catchall )</a>',\r
+'www_google_ca','<a href="http://www.google.ca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Canada</a>',\r
+'images_google_ca','<a href="http://images.google.ca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Canada ( images )</a>',\r
+'google_ca','<a href="http://google.ca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Canada ( catchall )</a>',\r
+'www_google_es','<a href="http://www.google.es/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Spain</a>',\r
+'images_google_es','<a href="http://images.google.es/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Spain ( images )</a>',\r
+'google_es','<a href="http://google.es/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Spain ( catchall )</a>',\r
+'www_google_com_au','<a href="http://www.google.com.au/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Australia</a>',\r
+'images_google_com_au','<a href="http://images.google.com.au/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Australia ( images )</a>',\r
+'google_com_au','<a href="http://google.com.au/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Australia ( catchall )</a>',\r
+'www_google_nl','<a href="http://www.google.nl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Netherlands</a>',\r
+'images_google_nl','<a href="http://images.google.nl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Netherlands ( images )</a>',\r
+'google_nl','<a href="http://google.nl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Netherlands ( catchall )</a>',\r
+'www_google_gr','<a href="http://www.google.gr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greece</a>',\r
+'images_google_gr','<a href="http://images.google.gr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greece ( images )</a>',\r
+'google_gr','<a href="http://google.gr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greece ( catchall )</a>',\r
+'www_google_se','<a href="http://www.google.se/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sweden</a>',\r
+'images_google_se','<a href="http://images.google.se/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sweden ( images )</a>',\r
+'google_se','<a href="http://google.se/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sweden ( catchall )</a>',\r
+'www_google_ie','<a href="http://www.google.ie/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ireland</a>',\r
+'images_google_ie','<a href="http://images.google.ie/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ireland ( images )</a>',\r
+'google_ie','<a href="http://google.ie/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ireland ( catchall )</a>',\r
+'www_google_it','<a href="http://www.google.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Italy</a>',\r
+'images_google_it','<a href="http://images.google.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Italy ( images )</a>',\r
+'google_it','<a href="http://google.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Italy ( catchall )</a>',\r
+'www_google_no','<a href="http://www.google.no/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norway</a>',\r
+'images_google_no','<a href="http://images.google.no/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norway ( images )</a>',\r
+'google_no','<a href="http://google.no/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norway ( catchall )</a>',\r
+'www_google_com_tr','<a href="http://www.google.com.tr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkey</a>',\r
+'images_google_com_tr','<a href="http://images.google.com.tr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkey ( images )</a>',\r
+'google_com_tr','<a href="http://google.com.tr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkey ( catchall )</a>',\r
+'www_google_co_in','<a href="http://www.google.co.in/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google India</a>',\r
+'images_google_co_in','<a href="http://images.google.co.in/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google India ( images )</a>',\r
+'google_co_in','<a href="http://google.co.in/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google India ( catchall )</a>',\r
+'www_google_pt','<a href="http://www.google.pt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Portugal</a>',\r
+'images_google_pt','<a href="http://images.google.pt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Portugal ( images )</a>',\r
+'google_pt','<a href="http://google.pt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Portugal ( catchall )</a>',\r
+'www_google_hr','<a href="http://www.google.hr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Croatia</a>',\r
+'images_google_hr','<a href="http://images.google.hr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Croatia ( images )</a>',\r
+'google_hr','<a href="http://google.hr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Croatia ( catchall )</a>',\r
+'www_google_co_nz','<a href="http://www.google.co.nz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google New Zealand</a>',\r
+'images_google_co_nz','<a href="http://images.google.co.nz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google New Zealand ( images )</a>',\r
+'google_co_nz','<a href="http://google.co.nz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google New Zealand ( catchall )</a>',\r
+'www_google_pl','<a href="http://www.google.pl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Poland</a>',\r
+'images_google_pl','<a href="http://images.google.pl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Poland ( images )</a>',\r
+'google_pl','<a href="http://google.pl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Poland ( catchall )</a>',\r
+'www_google_ac','<a href="http://www.google.ac/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ascension Island</a>',\r
+'images_google_ac','<a href="http://images.google.ac/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ascension Island ( images )</a>',\r
+'google_ac','<a href="http://google.ac/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ascension Island ( catchall )</a>',\r
+'www_google_ad','<a href="http://www.google.ad/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Andorra</a>',\r
+'images_google_ad','<a href="http://images.google.ad/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Andorra ( images )</a>',\r
+'google_ad','<a href="http://google.ad/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Andorra ( catchall )</a>',\r
+'www_google_ae','<a href="http://www.google.ae/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Arab Emirates</a>',\r
+'images_google_ae','<a href="http://images.google.ae/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Arab Emirates ( images )</a>',\r
+'google_ae','<a href="http://google.ae/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United Arab Emirates ( catchall )</a>',\r
+'www_google_al','<a href="http://www.google.al/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Albania</a>',\r
+'images_google_al','<a href="http://images.google.al/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Albania ( images )</a>',\r
+'google_al','<a href="http://google.al/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Albania ( catchall )</a>',\r
+'www_google_am','<a href="http://www.google.am/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Armenia</a>',\r
+'images_google_am','<a href="http://images.google.am/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Armenia ( images )</a>',\r
+'google_am','<a href="http://google.am/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Armenia ( catchall )</a>',\r
+'www_google_as','<a href="http://www.google.as/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google American Samoa</a>',\r
+'images_google_as','<a href="http://images.google.as/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google American Samoa ( images )</a>',\r
+'google_as','<a href="http://google.as/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google American Samoa ( catchall )</a>',\r
+'www_google_at','<a href="http://www.google.at/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Austria</a>',\r
+'images_google_at','<a href="http://images.google.at/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Austria ( images )</a>',\r
+'google_at','<a href="http://google.at/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Austria ( catchall )</a>',\r
+'www_google_az','<a href="http://www.google.az/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Azerbaijan</a>',\r
+'images_google_az','<a href="http://images.google.az/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Azerbaijan ( images )</a>',\r
+'google_az','<a href="http://google.az/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Azerbaijan ( catchall )</a>',\r
+'www_google_ba','<a href="http://www.google.ba/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bosnia and Herzegovina</a>',\r
+'images_google_ba','<a href="http://images.google.ba/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bosnia and Herzegovina ( images )</a>',\r
+'google_ba','<a href="http://google.ba/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bosnia and Herzegovina ( catchall )</a>',\r
+'www_google_be','<a href="http://www.google.be/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belgium</a>',\r
+'images_google_be','<a href="http://images.google.be/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belgium ( images )</a>',\r
+'google_be','<a href="http://google.be/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belgium ( catchall )</a>',\r
+'www_google_bf','<a href="http://www.google.bf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burkina Faso</a>',\r
+'images_google_bf','<a href="http://images.google.bf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burkina Faso ( images )</a>',\r
+'google_bf','<a href="http://google.bf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burkina Faso ( catchall )</a>',\r
+'www_google_bg','<a href="http://www.google.bg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bulgaria</a>',\r
+'images_google_bg','<a href="http://images.google.bg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bulgaria ( images )</a>',\r
+'google_bg','<a href="http://google.bg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bulgaria ( catchall )</a>',\r
+'www_google_bi','<a href="http://www.google.bi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burundi</a>',\r
+'images_google_bi','<a href="http://images.google.bi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burundi ( images )</a>',\r
+'google_bi','<a href="http://google.bi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Burundi ( catchall )</a>',\r
+'www_google_bj','<a href="http://www.google.bj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Benin</a>',\r
+'images_google_bj','<a href="http://images.google.bj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Benin ( images )</a>',\r
+'google_bj','<a href="http://google.bj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Benin ( catchall )</a>',\r
+'www_google_bs','<a href="http://www.google.bs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahamas</a>',\r
+'images_google_bs','<a href="http://images.google.bs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahamas ( images )</a>',\r
+'google_bs','<a href="http://google.bs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahamas ( catchall )</a>',\r
+'www_google_bt','<a href="http://www.google.bt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bhutan</a>',\r
+'images_google_bt','<a href="http://images.google.bt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bhutan ( images )</a>',\r
+'google_bt','<a href="http://google.bt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bhutan ( catchall )</a>',\r
+'www_google_by','<a href="http://www.google.by/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belarus</a>',\r
+'images_google_by','<a href="http://images.google.by/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belarus ( images )</a>',\r
+'google_by','<a href="http://google.by/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belarus ( catchall )</a>',\r
+'www_google_cat','<a href="http://www.google.cat/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Catalan Countries</a>',\r
+'images_google_cat','<a href="http://images.google.cat/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Catalan Countries ( images )</a>',\r
+'google_cat','<a href="http://google.cat/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Catalan Countries ( catchall )</a>',\r
+'www_google_cc','<a href="http://www.google.cc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cocos (Keeling) Islands</a>',\r
+'images_google_cc','<a href="http://images.google.cc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cocos (Keeling) Islands ( images )</a>',\r
+'google_cc','<a href="http://google.cc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cocos (Keeling) Islands ( catchall )</a>',\r
+'www_google_cd','<a href="http://www.google.cd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Democratic Republic of the Congo</a>',\r
+'images_google_cd','<a href="http://images.google.cd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Democratic Republic of the Congo ( images )</a>',\r
+'google_cd','<a href="http://google.cd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Democratic Republic of the Congo ( catchall )</a>',\r
+'www_google_cf','<a href="http://www.google.cf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Central African Republic</a>',\r
+'images_google_cf','<a href="http://images.google.cf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Central African Republic ( images )</a>',\r
+'google_cf','<a href="http://google.cf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Central African Republic ( catchall )</a>',\r
+'www_google_cg','<a href="http://www.google.cg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Republic of the Congo</a>',\r
+'images_google_cg','<a href="http://images.google.cg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Republic of the Congo ( images )</a>',\r
+'google_cg','<a href="http://google.cg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Republic of the Congo ( catchall )</a>',\r
+'www_google_ch','<a href="http://www.google.ch/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Switzerland</a>',\r
+'images_google_ch','<a href="http://images.google.ch/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Switzerland ( images )</a>',\r
+'google_ch','<a href="http://google.ch/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Switzerland ( catchall )</a>',\r
+'www_google_ci','<a href="http://www.google.ci/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ivory Coast</a>',\r
+'images_google_ci','<a href="http://images.google.ci/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ivory Coast ( images )</a>',\r
+'google_ci','<a href="http://google.ci/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ivory Coast ( catchall )</a>',\r
+'www_google_cl','<a href="http://www.google.cl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chile</a>',\r
+'images_google_cl','<a href="http://images.google.cl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chile ( images )</a>',\r
+'google_cl','<a href="http://google.cl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chile ( catchall )</a>',\r
+'www_google_cm','<a href="http://www.google.cm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cameroon</a>',\r
+'images_google_cm','<a href="http://images.google.cm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cameroon ( images )</a>',\r
+'google_cm','<a href="http://google.cm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cameroon ( catchall )</a>',\r
+'www_google_cn','<a href="http://www.google.cn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google China</a>',\r
+'images_google_cn','<a href="http://images.google.cn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google China ( images )</a>',\r
+'google_cn','<a href="http://google.cn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google China ( catchall )</a>',\r
+'www_google_co_ao','<a href="http://www.google.co.ao/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Angola</a>',\r
+'images_google_co_ao','<a href="http://images.google.co.ao/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Angola ( images )</a>',\r
+'google_co_ao','<a href="http://google.co.ao/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Angola ( catchall )</a>',\r
+'www_google_co_bw','<a href="http://www.google.co.bw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Botswana</a>',\r
+'images_google_co_bw','<a href="http://images.google.co.bw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Botswana ( images )</a>',\r
+'google_co_bw','<a href="http://google.co.bw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Botswana ( catchall )</a>',\r
+'www_google_co_ck','<a href="http://www.google.co.ck/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cook Islands</a>',\r
+'images_google_co_ck','<a href="http://images.google.co.ck/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cook Islands ( images )</a>',\r
+'google_co_ck','<a href="http://google.co.ck/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cook Islands ( catchall )</a>',\r
+'www_google_co_cr','<a href="http://www.google.co.cr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Costa Rica</a>',\r
+'images_google_co_cr','<a href="http://images.google.co.cr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Costa Rica ( images )</a>',\r
+'google_co_cr','<a href="http://google.co.cr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Costa Rica ( catchall )</a>',\r
+'www_google_co_id','<a href="http://www.google.co.id/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Indonesia</a>',\r
+'images_google_co_id','<a href="http://images.google.co.id/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Indonesia ( images )</a>',\r
+'google_co_id','<a href="http://google.co.id/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Indonesia ( catchall )</a>',\r
+'www_google_co_il','<a href="http://www.google.co.il/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Israel</a>',\r
+'images_google_co_il','<a href="http://images.google.co.il/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Israel ( images )</a>',\r
+'google_co_il','<a href="http://google.co.il/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Israel ( catchall )</a>',\r
+'www_google_co_jp','<a href="http://www.google.co.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Japan</a>',\r
+'images_google_co_jp','<a href="http://images.google.co.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Japan ( images )</a>',\r
+'google_co_jp','<a href="http://google.co.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Japan ( catchall )</a>',\r
+'www_google_co_ke','<a href="http://www.google.co.ke/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kenya</a>',\r
+'images_google_co_ke','<a href="http://images.google.co.ke/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kenya ( images )</a>',\r
+'google_co_ke','<a href="http://google.co.ke/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kenya ( catchall )</a>',\r
+'www_google_co_kr','<a href="http://www.google.co.kr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Korea</a>',\r
+'images_google_co_kr','<a href="http://images.google.co.kr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Korea ( images )</a>',\r
+'google_co_kr','<a href="http://google.co.kr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Korea ( catchall )</a>',\r
+'www_google_co_ls','<a href="http://www.google.co.ls/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lesotho</a>',\r
+'images_google_co_ls','<a href="http://images.google.co.ls/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lesotho ( images )</a>',\r
+'google_co_ls','<a href="http://google.co.ls/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lesotho ( catchall )</a>',\r
+'www_google_co_ma','<a href="http://www.google.co.ma/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Morocco</a>',\r
+'images_google_co_ma','<a href="http://images.google.co.ma/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Morocco ( images )</a>',\r
+'google_co_ma','<a href="http://google.co.ma/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Morocco ( catchall )</a>',\r
+'www_google_co_mz','<a href="http://www.google.co.mz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mozambique</a>',\r
+'images_google_co_mz','<a href="http://images.google.co.mz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mozambique ( images )</a>',\r
+'google_co_mz','<a href="http://google.co.mz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mozambique ( catchall )</a>',\r
+'www_google_co_th','<a href="http://www.google.co.th/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Thailand</a>',\r
+'images_google_co_th','<a href="http://images.google.co.th/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Thailand ( images )</a>',\r
+'google_co_th','<a href="http://google.co.th/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Thailand ( catchall )</a>',\r
+'www_google_co_tz','<a href="http://www.google.co.tz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tanzania</a>',\r
+'images_google_co_tz','<a href="http://images.google.co.tz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tanzania ( images )</a>',\r
+'google_co_tz','<a href="http://google.co.tz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tanzania ( catchall )</a>',\r
+'www_google_co_ug','<a href="http://www.google.co.ug/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uganda</a>',\r
+'images_google_co_ug','<a href="http://images.google.co.ug/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uganda ( images )</a>',\r
+'google_co_ug','<a href="http://google.co.ug/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uganda ( catchall )</a>',\r
+'www_google_co_uz','<a href="http://www.google.co.uz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uzbekistan</a>',\r
+'images_google_co_uz','<a href="http://images.google.co.uz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uzbekistan ( images )</a>',\r
+'google_co_uz','<a href="http://google.co.uz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uzbekistan ( catchall )</a>',\r
+'www_google_co_ve','<a href="http://www.google.co.ve/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Venezuela</a>',\r
+'images_google_co_ve','<a href="http://images.google.co.ve/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Venezuela ( images )</a>',\r
+'google_co_ve','<a href="http://google.co.ve/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Venezuela ( catchall )</a>',\r
+'www_google_co_vi','<a href="http://www.google.co.vi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States Virgin Islands</a>',\r
+'images_google_co_vi','<a href="http://images.google.co.vi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States Virgin Islands ( images )</a>',\r
+'google_co_vi','<a href="http://google.co.vi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States Virgin Islands ( catchall )</a>',\r
+'www_google_co_za','<a href="http://www.google.co.za/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Africa</a>',\r
+'images_google_co_za','<a href="http://images.google.co.za/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Africa ( images )</a>',\r
+'google_co_za','<a href="http://google.co.za/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google South Africa ( catchall )</a>',\r
+'www_google_co_zm','<a href="http://www.google.co.zm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zambia</a>',\r
+'images_google_co_zm','<a href="http://images.google.co.zm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zambia ( images )</a>',\r
+'google_co_zm','<a href="http://google.co.zm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zambia ( catchall )</a>',\r
+'www_google_co_zw','<a href="http://www.google.co.zw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zimbabwe</a>',\r
+'images_google_co_zw','<a href="http://images.google.co.zw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zimbabwe ( images )</a>',\r
+'google_co_zw','<a href="http://google.co.zw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Zimbabwe ( catchall )</a>',\r
+'www_google_com_af','<a href="http://www.google.com.af/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Afghanistan</a>',\r
+'images_google_com_af','<a href="http://images.google.com.af/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Afghanistan ( images )</a>',\r
+'google_com_af','<a href="http://google.com.af/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Afghanistan ( catchall )</a>',\r
+'www_google_com_ag','<a href="http://www.google.com.ag/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Antigua and Barbuda</a>',\r
+'images_google_com_ag','<a href="http://images.google.com.ag/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Antigua and Barbuda ( images )</a>',\r
+'google_com_ag','<a href="http://google.com.ag/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Antigua and Barbuda ( catchall )</a>',\r
+'www_google_com_ai','<a href="http://www.google.com.ai/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Anguilla</a>',\r
+'images_google_com_ai','<a href="http://images.google.com.ai/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Anguilla ( images )</a>',\r
+'google_com_ai','<a href="http://google.com.ai/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Anguilla ( catchall )</a>',\r
+'www_google_com_ar','<a href="http://www.google.com.ar/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Argentina</a>',\r
+'images_google_com_ar','<a href="http://images.google.com.ar/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Argentina ( images )</a>',\r
+'google_com_ar','<a href="http://google.com.ar/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Argentina ( catchall )</a>',\r
+'www_google_com_bd','<a href="http://www.google.com.bd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bangladesh</a>',\r
+'images_google_com_bd','<a href="http://images.google.com.bd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bangladesh ( images )</a>',\r
+'google_com_bd','<a href="http://google.com.bd/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bangladesh ( catchall )</a>',\r
+'www_google_com_bh','<a href="http://www.google.com.bh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahrain</a>',\r
+'images_google_com_bh','<a href="http://images.google.com.bh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahrain ( images )</a>',\r
+'google_com_bh','<a href="http://google.com.bh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bahrain ( catchall )</a>',\r
+'www_google_com_bn','<a href="http://www.google.com.bn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brunei</a>',\r
+'images_google_com_bn','<a href="http://images.google.com.bn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brunei ( images )</a>',\r
+'google_com_bn','<a href="http://google.com.bn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brunei ( catchall )</a>',\r
+'www_google_com_bo','<a href="http://www.google.com.bo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bolivia</a>',\r
+'images_google_com_bo','<a href="http://images.google.com.bo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bolivia ( images )</a>',\r
+'google_com_bo','<a href="http://google.com.bo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Bolivia ( catchall )</a>',\r
+'www_google_com_br','<a href="http://www.google.com.br/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brazil</a>',\r
+'images_google_com_br','<a href="http://images.google.com.br/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brazil ( images )</a>',\r
+'google_com_br','<a href="http://google.com.br/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Brazil ( catchall )</a>',\r
+'www_google_com_bz','<a href="http://www.google.com.bz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belize</a>',\r
+'images_google_com_bz','<a href="http://images.google.com.bz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belize ( images )</a>',\r
+'google_com_bz','<a href="http://google.com.bz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Belize ( catchall )</a>',\r
+'www_google_com_co','<a href="http://www.google.com.co/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Colombia</a>',\r
+'images_google_com_co','<a href="http://images.google.com.co/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Colombia ( images )</a>',\r
+'google_com_co','<a href="http://google.com.co/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Colombia ( catchall )</a>',\r
+'www_google_com_cu','<a href="http://www.google.com.cu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cuba</a>',\r
+'images_google_com_cu','<a href="http://images.google.com.cu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cuba ( images )</a>',\r
+'google_com_cu','<a href="http://google.com.cu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cuba ( catchall )</a>',\r
+'www_google_com_cy','<a href="http://www.google.com.cy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cyprus</a>',\r
+'images_google_com_cy','<a href="http://images.google.com.cy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cyprus ( images )</a>',\r
+'google_com_cy','<a href="http://google.com.cy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cyprus ( catchall )</a>',\r
+'www_google_com_do','<a href="http://www.google.com.do/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominican Republic</a>',\r
+'images_google_com_do','<a href="http://images.google.com.do/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominican Republic ( images )</a>',\r
+'google_com_do','<a href="http://google.com.do/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominican Republic ( catchall )</a>',\r
+'www_google_com_ec','<a href="http://www.google.com.ec/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ecuador</a>',\r
+'images_google_com_ec','<a href="http://images.google.com.ec/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ecuador ( images )</a>',\r
+'google_com_ec','<a href="http://google.com.ec/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ecuador ( catchall )</a>',\r
+'www_google_com_eg','<a href="http://www.google.com.eg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Egypt</a>',\r
+'images_google_com_eg','<a href="http://images.google.com.eg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Egypt ( images )</a>',\r
+'google_com_eg','<a href="http://google.com.eg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Egypt ( catchall )</a>',\r
+'www_google_com_et','<a href="http://www.google.com.et/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ethiopia</a>',\r
+'images_google_com_et','<a href="http://images.google.com.et/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ethiopia ( images )</a>',\r
+'google_com_et','<a href="http://google.com.et/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ethiopia ( catchall )</a>',\r
+'www_google_com_fj','<a href="http://www.google.com.fj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Fiji</a>',\r
+'images_google_com_fj','<a href="http://images.google.com.fj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Fiji ( images )</a>',\r
+'google_com_fj','<a href="http://google.com.fj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Fiji ( catchall )</a>',\r
+'www_google_com_gh','<a href="http://www.google.com.gh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ghana</a>',\r
+'images_google_com_gh','<a href="http://images.google.com.gh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ghana ( images )</a>',\r
+'google_com_gh','<a href="http://google.com.gh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ghana ( catchall )</a>',\r
+'www_google_com_gi','<a href="http://www.google.com.gi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gibraltar</a>',\r
+'images_google_com_gi','<a href="http://images.google.com.gi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gibraltar ( images )</a>',\r
+'google_com_gi','<a href="http://google.com.gi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gibraltar ( catchall )</a>',\r
+'www_google_com_gt','<a href="http://www.google.com.gt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guatemala</a>',\r
+'images_google_com_gt','<a href="http://images.google.com.gt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guatemala ( images )</a>',\r
+'google_com_gt','<a href="http://google.com.gt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guatemala ( catchall )</a>',\r
+'www_google_com_hk','<a href="http://www.google.com.hk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hong Kong</a>',\r
+'images_google_com_hk','<a href="http://images.google.com.hk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hong Kong ( images )</a>',\r
+'google_com_hk','<a href="http://google.com.hk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hong Kong ( catchall )</a>',\r
+'www_google_com_jm','<a href="http://www.google.com.jm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jamaica</a>',\r
+'images_google_com_jm','<a href="http://images.google.com.jm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jamaica ( images )</a>',\r
+'google_com_jm','<a href="http://google.com.jm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jamaica ( catchall )</a>',\r
+'www_google_com_kh','<a href="http://www.google.com.kh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cambodia</a>',\r
+'images_google_com_kh','<a href="http://images.google.com.kh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cambodia ( images )</a>',\r
+'google_com_kh','<a href="http://google.com.kh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cambodia ( catchall )</a>',\r
+'www_google_com_kw','<a href="http://www.google.com.kw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kuwait</a>',\r
+'images_google_com_kw','<a href="http://images.google.com.kw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kuwait ( images )</a>',\r
+'google_com_kw','<a href="http://google.com.kw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kuwait ( catchall )</a>',\r
+'www_google_com_lb','<a href="http://www.google.com.lb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lebanon</a>',\r
+'images_google_com_lb','<a href="http://images.google.com.lb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lebanon ( images )</a>',\r
+'google_com_lb','<a href="http://google.com.lb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lebanon ( catchall )</a>',\r
+'www_google_com_lc','<a href="http://www.google.com.lc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Lucia</a>',\r
+'images_google_com_lc','<a href="http://images.google.com.lc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Lucia ( images )</a>',\r
+'google_com_lc','<a href="http://google.com.lc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Lucia ( catchall )</a>',\r
+'www_google_com_ly','<a href="http://www.google.com.ly/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Libya</a>',\r
+'images_google_com_ly','<a href="http://images.google.com.ly/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Libya ( images )</a>',\r
+'google_com_ly','<a href="http://google.com.ly/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Libya ( catchall )</a>',\r
+'www_google_com_mm','<a href="http://www.google.com.mm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Myanmar</a>',\r
+'images_google_com_mm','<a href="http://images.google.com.mm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Myanmar ( images )</a>',\r
+'google_com_mm','<a href="http://google.com.mm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Myanmar ( catchall )</a>',\r
+'www_google_com_mt','<a href="http://www.google.com.mt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malta</a>',\r
+'images_google_com_mt','<a href="http://images.google.com.mt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malta ( images )</a>',\r
+'google_com_mt','<a href="http://google.com.mt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malta ( catchall )</a>',\r
+'www_google_com_mx','<a href="http://www.google.com.mx/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mexico</a>',\r
+'images_google_com_mx','<a href="http://images.google.com.mx/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mexico ( images )</a>',\r
+'google_com_mx','<a href="http://google.com.mx/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mexico ( catchall )</a>',\r
+'www_google_com_my','<a href="http://www.google.com.my/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malaysia</a>',\r
+'images_google_com_my','<a href="http://images.google.com.my/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malaysia ( images )</a>',\r
+'google_com_my','<a href="http://google.com.my/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malaysia ( catchall )</a>',\r
+'www_google_com_na','<a href="http://www.google.com.na/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Namibia</a>',\r
+'images_google_com_na','<a href="http://images.google.com.na/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Namibia ( images )</a>',\r
+'google_com_na','<a href="http://google.com.na/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Namibia ( catchall )</a>',\r
+'www_google_com_nf','<a href="http://www.google.com.nf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norfolk Island</a>',\r
+'images_google_com_nf','<a href="http://images.google.com.nf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norfolk Island ( images )</a>',\r
+'google_com_nf','<a href="http://google.com.nf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Norfolk Island ( catchall )</a>',\r
+'www_google_com_ng','<a href="http://www.google.com.ng/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nigeria</a>',\r
+'images_google_com_ng','<a href="http://images.google.com.ng/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nigeria ( images )</a>',\r
+'google_com_ng','<a href="http://google.com.ng/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nigeria ( catchall )</a>',\r
+'www_google_com_ni','<a href="http://www.google.com.ni/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nicaragua</a>',\r
+'images_google_com_ni','<a href="http://images.google.com.ni/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nicaragua ( images )</a>',\r
+'google_com_ni','<a href="http://google.com.ni/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nicaragua ( catchall )</a>',\r
+'www_google_com_np','<a href="http://www.google.com.np/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nepal</a>',\r
+'images_google_com_np','<a href="http://images.google.com.np/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nepal ( images )</a>',\r
+'google_com_np','<a href="http://google.com.np/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nepal ( catchall )</a>',\r
+'www_google_com_om','<a href="http://www.google.com.om/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Oman</a>',\r
+'images_google_com_om','<a href="http://images.google.com.om/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Oman ( images )</a>',\r
+'google_com_om','<a href="http://google.com.om/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Oman ( catchall )</a>',\r
+'www_google_com_pa','<a href="http://www.google.com.pa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Panama</a>',\r
+'images_google_com_pa','<a href="http://images.google.com.pa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Panama ( images )</a>',\r
+'google_com_pa','<a href="http://google.com.pa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Panama ( catchall )</a>',\r
+'www_google_com_pe','<a href="http://www.google.com.pe/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Peru</a>',\r
+'images_google_com_pe','<a href="http://images.google.com.pe/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Peru ( images )</a>',\r
+'google_com_pe','<a href="http://google.com.pe/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Peru ( catchall )</a>',\r
+'www_google_com_pg','<a href="http://www.google.com.pg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Papua New Guinea</a>',\r
+'images_google_com_pg','<a href="http://images.google.com.pg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Papua New Guinea ( images )</a>',\r
+'google_com_pg','<a href="http://google.com.pg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Papua New Guinea ( catchall )</a>',\r
+'www_google_com_ph','<a href="http://www.google.com.ph/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Philippines</a>',\r
+'images_google_com_ph','<a href="http://images.google.com.ph/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Philippines ( images )</a>',\r
+'google_com_ph','<a href="http://google.com.ph/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Philippines ( catchall )</a>',\r
+'www_google_com_pk','<a href="http://www.google.com.pk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pakistan</a>',\r
+'images_google_com_pk','<a href="http://images.google.com.pk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pakistan ( images )</a>',\r
+'google_com_pk','<a href="http://google.com.pk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pakistan ( catchall )</a>',\r
+'www_google_com_pr','<a href="http://www.google.com.pr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Puerto Rico</a>',\r
+'images_google_com_pr','<a href="http://images.google.com.pr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Puerto Rico ( images )</a>',\r
+'google_com_pr','<a href="http://google.com.pr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Puerto Rico ( catchall )</a>',\r
+'www_google_com_py','<a href="http://www.google.com.py/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Paraguay</a>',\r
+'images_google_com_py','<a href="http://images.google.com.py/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Paraguay ( images )</a>',\r
+'google_com_py','<a href="http://google.com.py/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Paraguay ( catchall )</a>',\r
+'www_google_com_qa','<a href="http://www.google.com.qa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Qatar</a>',\r
+'images_google_com_qa','<a href="http://images.google.com.qa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Qatar ( images )</a>',\r
+'google_com_qa','<a href="http://google.com.qa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Qatar ( catchall )</a>',\r
+'www_google_com_sa','<a href="http://www.google.com.sa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saudi Arabia</a>',\r
+'images_google_com_sa','<a href="http://images.google.com.sa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saudi Arabia ( images )</a>',\r
+'google_com_sa','<a href="http://google.com.sa/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saudi Arabia ( catchall )</a>',\r
+'www_google_com_sb','<a href="http://www.google.com.sb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Solomon Islands</a>',\r
+'images_google_com_sb','<a href="http://images.google.com.sb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Solomon Islands ( images )</a>',\r
+'google_com_sb','<a href="http://google.com.sb/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Solomon Islands ( catchall )</a>',\r
+'www_google_com_sg','<a href="http://www.google.com.sg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Singapore</a>',\r
+'images_google_com_sg','<a href="http://images.google.com.sg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Singapore ( images )</a>',\r
+'google_com_sg','<a href="http://google.com.sg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Singapore ( catchall )</a>',\r
+'www_google_com_sl','<a href="http://www.google.com.sl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sierra Leone</a>',\r
+'images_google_com_sl','<a href="http://images.google.com.sl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sierra Leone ( images )</a>',\r
+'google_com_sl','<a href="http://google.com.sl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sierra Leone ( catchall )</a>',\r
+'www_google_com_sv','<a href="http://www.google.com.sv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google El Salvador</a>',\r
+'images_google_com_sv','<a href="http://images.google.com.sv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google El Salvador ( images )</a>',\r
+'google_com_sv','<a href="http://google.com.sv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google El Salvador ( catchall )</a>',\r
+'www_google_com_tj','<a href="http://www.google.com.tj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tajikistan</a>',\r
+'images_google_com_tj','<a href="http://images.google.com.tj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tajikistan ( images )</a>',\r
+'google_com_tj','<a href="http://google.com.tj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tajikistan ( catchall )</a>',\r
+'www_google_com_tw','<a href="http://www.google.com.tw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Taiwan</a>',\r
+'images_google_com_tw','<a href="http://images.google.com.tw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Taiwan ( images )</a>',\r
+'google_com_tw','<a href="http://google.com.tw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Taiwan ( catchall )</a>',\r
+'www_google_com_ua','<a href="http://www.google.com.ua/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ukraine</a>',\r
+'images_google_com_ua','<a href="http://images.google.com.ua/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ukraine ( images )</a>',\r
+'google_com_ua','<a href="http://google.com.ua/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Ukraine ( catchall )</a>',\r
+'www_google_com_uy','<a href="http://www.google.com.uy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uruguay</a>',\r
+'images_google_com_uy','<a href="http://images.google.com.uy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uruguay ( images )</a>',\r
+'google_com_uy','<a href="http://google.com.uy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Uruguay ( catchall )</a>',\r
+'www_google_com_vc','<a href="http://www.google.com.vc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Vincent and the Grenadines</a>',\r
+'images_google_com_vc','<a href="http://images.google.com.vc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Vincent and the Grenadines ( images )</a>',\r
+'google_com_vc','<a href="http://google.com.vc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Vincent and the Grenadines ( catchall )</a>',\r
+'www_google_com_vn','<a href="http://www.google.com.vn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vietnam</a>',\r
+'images_google_com_vn','<a href="http://images.google.com.vn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vietnam ( images )</a>',\r
+'google_com_vn','<a href="http://google.com.vn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vietnam ( catchall )</a>',\r
+'www_google_cv','<a href="http://www.google.cv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cape Verde</a>',\r
+'images_google_cv','<a href="http://images.google.cv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cape Verde ( images )</a>',\r
+'google_cv','<a href="http://google.cv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Cape Verde ( catchall )</a>',\r
+'www_google_cz','<a href="http://www.google.cz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Czech Republic</a>',\r
+'images_google_cz','<a href="http://images.google.cz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Czech Republic ( images )</a>',\r
+'google_cz','<a href="http://google.cz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Czech Republic ( catchall )</a>',\r
+'www_google_dj','<a href="http://www.google.dj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Djibouti</a>',\r
+'images_google_dj','<a href="http://images.google.dj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Djibouti ( images )</a>',\r
+'google_dj','<a href="http://google.dj/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Djibouti ( catchall )</a>',\r
+'www_google_dk','<a href="http://www.google.dk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Denmark</a>',\r
+'images_google_dk','<a href="http://images.google.dk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Denmark ( images )</a>',\r
+'google_dk','<a href="http://google.dk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Denmark ( catchall )</a>',\r
+'www_google_dm','<a href="http://www.google.dm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominica</a>',\r
+'images_google_dm','<a href="http://images.google.dm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominica ( images )</a>',\r
+'google_dm','<a href="http://google.dm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Dominica ( catchall )</a>',\r
+'www_google_dz','<a href="http://www.google.dz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Algeria</a>',\r
+'images_google_dz','<a href="http://images.google.dz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Algeria ( images )</a>',\r
+'google_dz','<a href="http://google.dz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Algeria ( catchall )</a>',\r
+'www_google_ee','<a href="http://www.google.ee/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Estonia</a>',\r
+'images_google_ee','<a href="http://images.google.ee/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Estonia ( images )</a>',\r
+'google_ee','<a href="http://google.ee/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Estonia ( catchall )</a>',\r
+'www_google_fi','<a href="http://www.google.fi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Finland</a>',\r
+'images_google_fi','<a href="http://images.google.fi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Finland ( images )</a>',\r
+'google_fi','<a href="http://google.fi/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Finland ( catchall )</a>',\r
+'www_google_fm','<a href="http://www.google.fm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Federated States of Micronesia</a>',\r
+'images_google_fm','<a href="http://images.google.fm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Federated States of Micronesia ( images )</a>',\r
+'google_fm','<a href="http://google.fm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Federated States of Micronesia ( catchall )</a>',\r
+'www_google_ga','<a href="http://www.google.ga/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gabon</a>',\r
+'images_google_ga','<a href="http://images.google.ga/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gabon ( images )</a>',\r
+'google_ga','<a href="http://google.ga/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gabon ( catchall )</a>',\r
+'www_google_ge','<a href="http://www.google.ge/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Georgia</a>',\r
+'images_google_ge','<a href="http://images.google.ge/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Georgia ( images )</a>',\r
+'google_ge','<a href="http://google.ge/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Georgia ( catchall )</a>',\r
+'www_google_gf','<a href="http://www.google.gf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google French Guiana</a>',\r
+'images_google_gf','<a href="http://images.google.gf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google French Guiana ( images )</a>',\r
+'google_gf','<a href="http://google.gf/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google French Guiana ( catchall )</a>',\r
+'www_google_gg','<a href="http://www.google.gg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guernsey</a>',\r
+'images_google_gg','<a href="http://images.google.gg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guernsey ( images )</a>',\r
+'google_gg','<a href="http://google.gg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guernsey ( catchall )</a>',\r
+'www_google_gl','<a href="http://www.google.gl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greenland</a>',\r
+'images_google_gl','<a href="http://images.google.gl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greenland ( images )</a>',\r
+'google_gl','<a href="http://google.gl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Greenland ( catchall )</a>',\r
+'www_google_gm','<a href="http://www.google.gm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gambia</a>',\r
+'images_google_gm','<a href="http://images.google.gm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gambia ( images )</a>',\r
+'google_gm','<a href="http://google.gm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Gambia ( catchall )</a>',\r
+'www_google_gp','<a href="http://www.google.gp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guadeloupe</a>',\r
+'images_google_gp','<a href="http://images.google.gp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guadeloupe ( images )</a>',\r
+'google_gp','<a href="http://google.gp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guadeloupe ( catchall )</a>',\r
+'www_google_gy','<a href="http://www.google.gy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guyana</a>',\r
+'images_google_gy','<a href="http://images.google.gy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guyana ( images )</a>',\r
+'google_gy','<a href="http://google.gy/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Guyana ( catchall )</a>',\r
+'www_google_hn','<a href="http://www.google.hn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Honduras</a>',\r
+'images_google_hn','<a href="http://images.google.hn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Honduras ( images )</a>',\r
+'google_hn','<a href="http://google.hn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Honduras ( catchall )</a>',\r
+'www_google_ht','<a href="http://www.google.ht/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Haiti</a>',\r
+'images_google_ht','<a href="http://images.google.ht/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Haiti ( images )</a>',\r
+'google_ht','<a href="http://google.ht/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Haiti ( catchall )</a>',\r
+'www_google_hu','<a href="http://www.google.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hungary</a>',\r
+'images_google_hu','<a href="http://images.google.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hungary ( images )</a>',\r
+'google_hu','<a href="http://google.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Hungary ( catchall )</a>',\r
+'www_google_im','<a href="http://www.google.im/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Isle of Man</a>',\r
+'images_google_im','<a href="http://images.google.im/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Isle of Man ( images )</a>',\r
+'google_im','<a href="http://google.im/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Isle of Man ( catchall )</a>',\r
+'www_google_io','<a href="http://www.google.io/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Indian Ocean Territory</a>',\r
+'images_google_io','<a href="http://images.google.io/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Indian Ocean Territory ( images )</a>',\r
+'google_io','<a href="http://google.io/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Indian Ocean Territory ( catchall )</a>',\r
+'www_google_iq','<a href="http://www.google.iq/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iraq</a>',\r
+'images_google_iq','<a href="http://images.google.iq/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iraq ( images )</a>',\r
+'google_iq','<a href="http://google.iq/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iraq ( catchall )</a>',\r
+'www_google_is','<a href="http://www.google.is/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iceland</a>',\r
+'images_google_is','<a href="http://images.google.is/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iceland ( images )</a>',\r
+'google_is','<a href="http://google.is/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Iceland ( catchall )</a>',\r
+'www_google_je','<a href="http://www.google.je/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jersey</a>',\r
+'images_google_je','<a href="http://images.google.je/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jersey ( images )</a>',\r
+'google_je','<a href="http://google.je/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jersey ( catchall )</a>',\r
+'www_google_jo','<a href="http://www.google.jo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jordan</a>',\r
+'images_google_jo','<a href="http://images.google.jo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jordan ( images )</a>',\r
+'google_jo','<a href="http://google.jo/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Jordan ( catchall )</a>',\r
+'www_google_kg','<a href="http://www.google.kg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kyrgyzstan</a>',\r
+'images_google_kg','<a href="http://images.google.kg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kyrgyzstan ( images )</a>',\r
+'google_kg','<a href="http://google.kg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kyrgyzstan ( catchall )</a>',\r
+'www_google_ki','<a href="http://www.google.ki/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kiribati</a>',\r
+'images_google_ki','<a href="http://images.google.ki/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kiribati ( images )</a>',\r
+'google_ki','<a href="http://google.ki/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kiribati ( catchall )</a>',\r
+'www_google_kz','<a href="http://www.google.kz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kazakhstan</a>',\r
+'images_google_kz','<a href="http://images.google.kz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kazakhstan ( images )</a>',\r
+'google_kz','<a href="http://google.kz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Kazakhstan ( catchall )</a>',\r
+'www_google_la','<a href="http://www.google.la/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Laos</a>',\r
+'images_google_la','<a href="http://images.google.la/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Laos ( images )</a>',\r
+'google_la','<a href="http://google.la/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Laos ( catchall )</a>',\r
+'www_google_li','<a href="http://www.google.li/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Liechtenstein</a>',\r
+'images_google_li','<a href="http://images.google.li/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Liechtenstein ( images )</a>',\r
+'google_li','<a href="http://google.li/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Liechtenstein ( catchall )</a>',\r
+'www_google_lk','<a href="http://www.google.lk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sri Lanka</a>',\r
+'images_google_lk','<a href="http://images.google.lk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sri Lanka ( images )</a>',\r
+'google_lk','<a href="http://google.lk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sri Lanka ( catchall )</a>',\r
+'www_google_lt','<a href="http://www.google.lt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lithuania</a>',\r
+'images_google_lt','<a href="http://images.google.lt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lithuania ( images )</a>',\r
+'google_lt','<a href="http://google.lt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Lithuania ( catchall )</a>',\r
+'www_google_lu','<a href="http://www.google.lu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Luxembourg</a>',\r
+'images_google_lu','<a href="http://images.google.lu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Luxembourg ( images )</a>',\r
+'google_lu','<a href="http://google.lu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Luxembourg ( catchall )</a>',\r
+'www_google_lv','<a href="http://www.google.lv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Latvia</a>',\r
+'images_google_lv','<a href="http://images.google.lv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Latvia ( images )</a>',\r
+'google_lv','<a href="http://google.lv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Latvia ( catchall )</a>',\r
+'www_google_md','<a href="http://www.google.md/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Moldova</a>',\r
+'images_google_md','<a href="http://images.google.md/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Moldova ( images )</a>',\r
+'google_md','<a href="http://google.md/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Moldova ( catchall )</a>',\r
+'www_google_me','<a href="http://www.google.me/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montenegro</a>',\r
+'images_google_me','<a href="http://images.google.me/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montenegro ( images )</a>',\r
+'google_me','<a href="http://google.me/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montenegro ( catchall )</a>',\r
+'www_google_mg','<a href="http://www.google.mg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Madagascar</a>',\r
+'images_google_mg','<a href="http://images.google.mg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Madagascar ( images )</a>',\r
+'google_mg','<a href="http://google.mg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Madagascar ( catchall )</a>',\r
+'www_google_mk','<a href="http://www.google.mk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Macedonia</a>',\r
+'images_google_mk','<a href="http://images.google.mk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Macedonia ( images )</a>',\r
+'google_mk','<a href="http://google.mk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Macedonia ( catchall )</a>',\r
+'www_google_ml','<a href="http://www.google.ml/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mali</a>',\r
+'images_google_ml','<a href="http://images.google.ml/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mali ( images )</a>',\r
+'google_ml','<a href="http://google.ml/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mali ( catchall )</a>',\r
+'www_google_mn','<a href="http://www.google.mn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mongolia</a>',\r
+'images_google_mn','<a href="http://images.google.mn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mongolia ( images )</a>',\r
+'google_mn','<a href="http://google.mn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mongolia ( catchall )</a>',\r
+'www_google_ms','<a href="http://www.google.ms/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montserrat</a>',\r
+'images_google_ms','<a href="http://images.google.ms/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montserrat ( images )</a>',\r
+'google_ms','<a href="http://google.ms/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Montserrat ( catchall )</a>',\r
+'www_google_mu','<a href="http://www.google.mu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mauritius</a>',\r
+'images_google_mu','<a href="http://images.google.mu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mauritius ( images )</a>',\r
+'google_mu','<a href="http://google.mu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Mauritius ( catchall )</a>',\r
+'www_google_mv','<a href="http://www.google.mv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Maldives</a>',\r
+'images_google_mv','<a href="http://images.google.mv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Maldives ( images )</a>',\r
+'google_mv','<a href="http://google.mv/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Maldives ( catchall )</a>',\r
+'www_google_mw','<a href="http://www.google.mw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malawi</a>',\r
+'images_google_mw','<a href="http://images.google.mw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malawi ( images )</a>',\r
+'google_mw','<a href="http://google.mw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Malawi ( catchall )</a>',\r
+'www_google_ne','<a href="http://www.google.ne/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niger</a>',\r
+'images_google_ne','<a href="http://images.google.ne/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niger ( images )</a>',\r
+'google_ne','<a href="http://google.ne/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niger ( catchall )</a>',\r
+'www_google_nr','<a href="http://www.google.nr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nauru</a>',\r
+'images_google_nr','<a href="http://images.google.nr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nauru ( images )</a>',\r
+'google_nr','<a href="http://google.nr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Nauru ( catchall )</a>',\r
+'www_google_nu','<a href="http://www.google.nu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niue</a>',\r
+'images_google_nu','<a href="http://images.google.nu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niue ( images )</a>',\r
+'google_nu','<a href="http://google.nu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Niue ( catchall )</a>',\r
+'www_google_pn','<a href="http://www.google.pn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pitcairn Islands</a>',\r
+'images_google_pn','<a href="http://images.google.pn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pitcairn Islands ( images )</a>',\r
+'google_pn','<a href="http://google.pn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Pitcairn Islands ( catchall )</a>',\r
+'www_google_ps','<a href="http://www.google.ps/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Palestine</a>',\r
+'images_google_ps','<a href="http://images.google.ps/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Palestine ( images )</a>',\r
+'google_ps','<a href="http://google.ps/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Palestine ( catchall )</a>',\r
+'www_google_ro','<a href="http://www.google.ro/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Romania</a>',\r
+'images_google_ro','<a href="http://images.google.ro/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Romania ( images )</a>',\r
+'google_ro','<a href="http://google.ro/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Romania ( catchall )</a>',\r
+'www_google_rs','<a href="http://www.google.rs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Serbia</a>',\r
+'images_google_rs','<a href="http://images.google.rs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Serbia ( images )</a>',\r
+'google_rs','<a href="http://google.rs/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Serbia ( catchall )</a>',\r
+'www_google_ru','<a href="http://www.google.ru/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Russia</a>',\r
+'images_google_ru','<a href="http://images.google.ru/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Russia ( images )</a>',\r
+'google_ru','<a href="http://google.ru/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Russia ( catchall )</a>',\r
+'www_google_rw','<a href="http://www.google.rw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Rwanda</a>',\r
+'images_google_rw','<a href="http://images.google.rw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Rwanda ( images )</a>',\r
+'google_rw','<a href="http://google.rw/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Rwanda ( catchall )</a>',\r
+'www_google_sc','<a href="http://www.google.sc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Seychelles</a>',\r
+'images_google_sc','<a href="http://images.google.sc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Seychelles ( images )</a>',\r
+'google_sc','<a href="http://google.sc/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Seychelles ( catchall )</a>',\r
+'www_google_sh','<a href="http://www.google.sh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Helena and Ascension and Tristan da Cunha</a>',\r
+'images_google_sh','<a href="http://images.google.sh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Helena and Ascension and Tristan da Cunha ( images )</a>',\r
+'google_sh','<a href="http://google.sh/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Saint Helena and Ascension and Tristan da Cunha ( catchall )</a>',\r
+'www_google_si','<a href="http://www.google.si/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovenia</a>',\r
+'images_google_si','<a href="http://images.google.si/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovenia ( images )</a>',\r
+'google_si','<a href="http://google.si/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovenia ( catchall )</a>',\r
+'www_google_sk','<a href="http://www.google.sk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovakia</a>',\r
+'images_google_sk','<a href="http://images.google.sk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovakia ( images )</a>',\r
+'google_sk','<a href="http://google.sk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Slovakia ( catchall )</a>',\r
+'www_google_sm','<a href="http://www.google.sm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google San Marino</a>',\r
+'images_google_sm','<a href="http://images.google.sm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google San Marino ( images )</a>',\r
+'google_sm','<a href="http://google.sm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google San Marino ( catchall )</a>',\r
+'www_google_sn','<a href="http://www.google.sn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Senegal</a>',\r
+'images_google_sn','<a href="http://images.google.sn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Senegal ( images )</a>',\r
+'google_sn','<a href="http://google.sn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Senegal ( catchall )</a>',\r
+'www_google_so','<a href="http://www.google.so/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Somalia</a>',\r
+'images_google_so','<a href="http://images.google.so/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Somalia ( images )</a>',\r
+'google_so','<a href="http://google.so/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Somalia ( catchall )</a>',\r
+'www_google_sr','<a href="http://www.google.sr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Suriname</a>',\r
+'images_google_sr','<a href="http://images.google.sr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Suriname ( images )</a>',\r
+'google_sr','<a href="http://google.sr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Suriname ( catchall )</a>',\r
+'www_google_st','<a href="http://www.google.st/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sao Tome and Principe</a>',\r
+'images_google_st','<a href="http://images.google.st/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sao Tome and Principe ( images )</a>',\r
+'google_st','<a href="http://google.st/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Sao Tome and Principe ( catchall )</a>',\r
+'www_google_td','<a href="http://www.google.td/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chad</a>',\r
+'images_google_td','<a href="http://images.google.td/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chad ( images )</a>',\r
+'google_td','<a href="http://google.td/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Chad ( catchall )</a>',\r
+'www_google_tg','<a href="http://www.google.tg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Togo</a>',\r
+'images_google_tg','<a href="http://images.google.tg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Togo ( images )</a>',\r
+'google_tg','<a href="http://google.tg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Togo ( catchall )</a>',\r
+'www_google_tk','<a href="http://www.google.tk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tokelau</a>',\r
+'images_google_tk','<a href="http://images.google.tk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tokelau ( images )</a>',\r
+'google_tk','<a href="http://google.tk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tokelau ( catchall )</a>',\r
+'www_google_tl','<a href="http://www.google.tl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Timor-Leste</a>',\r
+'images_google_tl','<a href="http://images.google.tl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Timor-Leste ( images )</a>',\r
+'google_tl','<a href="http://google.tl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Timor-Leste ( catchall )</a>',\r
+'www_google_tm','<a href="http://www.google.tm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkmenistan</a>',\r
+'images_google_tm','<a href="http://images.google.tm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkmenistan ( images )</a>',\r
+'google_tm','<a href="http://google.tm/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Turkmenistan ( catchall )</a>',\r
+'www_google_tn','<a href="http://www.google.tn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tunisia</a>',\r
+'images_google_tn','<a href="http://images.google.tn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tunisia ( images )</a>',\r
+'google_tn','<a href="http://google.tn/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tunisia ( catchall )</a>',\r
+'www_google_to','<a href="http://www.google.to/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tonga</a>',\r
+'images_google_to','<a href="http://images.google.to/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tonga ( images )</a>',\r
+'google_to','<a href="http://google.to/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Tonga ( catchall )</a>',\r
+'www_google_tt','<a href="http://www.google.tt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Trinidad and Tobago</a>',\r
+'images_google_tt','<a href="http://images.google.tt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Trinidad and Tobago ( images )</a>',\r
+'google_tt','<a href="http://google.tt/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Trinidad and Tobago ( catchall )</a>',\r
+'www_google_us','<a href="http://www.google.us/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States</a>',\r
+'images_google_us','<a href="http://images.google.us/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States ( images )</a>',\r
+'google_us','<a href="http://google.us/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google United States ( catchall )</a>',\r
+'www_google_vg','<a href="http://www.google.vg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Virgin Islands</a>',\r
+'images_google_vg','<a href="http://images.google.vg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Virgin Islands ( images )</a>',\r
+'google_vg','<a href="http://google.vg/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google British Virgin Islands ( catchall )</a>',\r
+'www_google_vu','<a href="http://www.google.vu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vanuatu</a>',\r
+'images_google_vu','<a href="http://images.google.vu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vanuatu ( images )</a>',\r
+'google_vu','<a href="http://google.vu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Vanuatu ( catchall )</a>',\r
+'www_google_ws','<a href="http://www.google.ws/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Samoa</a>',\r
+'images_google_ws','<a href="http://images.google.ws/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Samoa ( images )</a>',\r
+'google_ws','<a href="http://google.ws/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Samoa ( catchall )</a>',\r
+\r
+'google_cache','<a href="http://www.google.com/help/features.html#cached" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google (cache)</a>',\r
+'google_froogle','<a href="http://froogle.google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Froogle (Google)</a>',\r
+'google_groups','<a href="http://groups.google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google (Groups)</a>',\r
+'google_maps','<a href="http://maps.google.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google Maps</a>',\r
+'googleByIP','<a href="http://173.194.35.177/" rel="nofollow" title="Google (Access by IP-Address) [new window]" target="_blank">Google (Access by IP-Address)</a>',\r
+'google_catchall','<a href="http://www.google.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google catchall sites not specified</a>',\r
+'google_products','<a href="http://www.google.com/products" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Google (Products)</a>',\r
+'google_translate','google translate',\r
+'google4counter','<a href="http://www.4-counter.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">4-counter (Google)</a>',\r
+\r
+'1klik','1Klik',\r
+'1search','<a href="http://1search-board.com/" rel="nofollow" target="_blank">1search-board.com</a>',\r
+'1und1_de','<a href="http://suche.1und1.de/" rel="nofollow" title="1&amp;1 Suche [new window]" target="_blank">1&amp;1 Suche (subdomain "suche")</a>',\r
+'3721','<a href="http://www.3721.com/" rel="nofollow" target="_blank">3721</a>',\r
+'a9', '<a href="http://www.a9.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">A9</a>',\r
+'abacho','Abacho',\r
+'accoona','<a href="http://cn.accoona.com">Accoona</a>',\r
+'alexa','<a href="http://www.alexa.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Alexa</a>',\r
+'aliceit','<a href="http://www.alice.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">alice.it</a>',\r
+'aliceitmaster','<a href="http://www.alice.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">search.alice.it.master</a>',\r
+'allesklar','allesklar.de',\r
+'allgameshome','<a href="http://my.allgameshome.com/" rel="nofollow" title="AllGamesHome [new window]" target="_blank">AllGamesHome</a>',\r
+'alltheweb','<a href="http://www.alltheweb.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AllTheWeb</a>',\r
+'alot','alot',\r
+'altavista','<a href="http://www.altavista.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AltaVista</a>',\r
+'amazon','amazon',\r
+'androidsearch','<a href="http://www.androidsearch.com/" rel="nofollow" title="androidsearch.com [new window]" target="_blank">androidsearch.com</a>',\r
+'answerbus','<a href="http://www.answerbus.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Answerbus</a>',\r
+'anzwers','<a href="http://anzwers.com.au/" title="anzwers.com.au home page [new window]" rel="nofollow" target="_blank">anzwers.com.au</a>',\r
+'aol_o2suche_de','AOL O2Suche (de)', \r
+'aolcatchall','<a href="http://search.aol.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AOL catchall countries</a>',\r
+'aolcom','<a href="http://search.aol.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AOL .com</a>',\r
+'aolde','<a href="http://suche.aol.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AOL .de</a>',\r
+'aolfr','AOL (fr)', \r
+'aolpl','<a href="http://search.aol.pl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AOL .pl</a>',\r
+'aolsearchde','<a href="http://de.aolsearch.com/" rel="nofollow" title="AOL Search Home Page [new window]" target="_blank">AOL Search de</a>',\r
+'aoluk','<a href="http://search.aol.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AOL .uk</a>',\r
+'aport','Aport',\r
+'arianna','<a href="http://arianna.libero.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Arianna</a>',\r
+'asevenboard','<a href="http://asevenboard.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">asevenboard</a>',\r
+'askcatchall','<a href="http://www.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask catchall sites</a>',\r
+'askde','<a href="http://de.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask Deutschland</a>',\r
+'askes','<a href="http://es.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask Espana</a>', # break out Ask country specific engines.\r
+'askfr','<a href="http://fr.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask France</a>',\r
+'askimages','ask images',\r
+'askit','<a href="http://it.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask Italia</a>',\r
+'askjp','<a href="http://www.ask.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask Japan</a>',\r
+'asknl','<a href="http://nl.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask Nederland</a>',\r
+'askuk','<a href="http://uk.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ask UK</a>',\r
+'atlanticbb','atlanticbb',\r
+'atlas','Atlas.cz',\r
+'atomz','Atomz',\r
+'att','<a href="http://www.att.net/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">AT&amp;T search (powered by Google)</a>',\r
+'au_search_yahoo_com','<a href="http://au.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo au.search.yahoo.com</a>',\r
+'auone','auone',\r
+'avantfind','<a href="http://www.avantfind.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Avantfind</a>',\r
+'avg','avg',\r
+'babylon','<a href="http://search.babylon.com/" title="search.babylon.com" rel="nofollow" target="_blank">Babylon</a>',\r
+'baidu','<a href="http://www.baidu.com/" rel="nofollow" target="_blank">Baidu</a>',\r
+'bbc','BBC', \r
+'benefind','<a href="http://www.benefind.de/" rel="nofollow" title="benefind Home Page [new window]" target="_blank">benefind</a>',\r
+'biglotron','<a href="http://www.biglotron.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Biglotron</a>',\r
+'bing','<a href="http://www.bing.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Bing</a>',\r
+'blekko','blekko',\r
+'blingo','<a href="http://www.blingo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Blingo</a>',\r
+'bluewin','bluewin',\r
+'bt','BT',\r
+'bungeebonesdotcom','<a href="http://BungeeBones.com/search.php/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">BungeeBones</a>',\r
+'ca_search_yahoo_com','<a href="http://ca.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo ca.search.yahoo.com</a>',\r
+'centraldatabase','<a href="http://search.centraldatabase.org/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">GPU p2p search</a>',\r
+'centrum','Centrum.cz', \r
+'centurylink','centurylink',\r
+'certifiedtoolbarsearch','<a href="http://search.certified-toolbar.com/" rel="nofollow" title="Certified-Toolbar Search [new window]" target="_blank">Certified-Toolbar Search</a>',\r
+'charter','charter',\r
+'chatzum','chatzum',\r
+'checkparams','checkparams',\r
+'chelloat','<a href="http://www.chello.at/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Austria</a>',\r
+'chellobe','<a href="http://www.chello.be/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Belgium</a>',\r
+'chellocom','<a href="http://www.chello.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello (Country not recognized)</a>',\r
+'chellocz','<a href="http://www.chello.cz/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Czech Republic</a>',\r
+'chellofr','<a href="http://www.chello.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello France</a>',\r
+'chellohu','<a href="http://www.chello.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Hungary</a>',\r
+'chellonl','<a href="http://www.chello.nl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Netherlands</a>',\r
+'chellono','<a href="http://www.chello.no/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Norway</a>',\r
+'chellopl','<a href="http://www.chello.pl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Poland</a>',\r
+'chellose','<a href="http://www.chello.se/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Sweden</a>',\r
+'chellosk','<a href="http://www.chello.sk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Chello Slovakia</a>',\r
+'clarosearch','<a href="http://www.claro-search.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Claro Search</a>',\r
+'clinck','clinck',\r
+'clubinternet', 'Club-internet',\r
+'clusty','<a href="http://www.clusty.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Clusty</a>',\r
+'comcast','comcast',\r
+'comettoolbar','<a href="http://as.starware.com/dp/search" title="Comet toolbar search home page [new window]" rel="nofollow" target="_blank">Comet toolbar search</a>',\r
+'conduit','conduit',\r
+'copernic','<a href="http://www.copernic.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Copernic</a>',\r
+'crawler','<a href="http://www.crawler.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">crawler.com</a>',\r
+'ctrouve','C\'est trouve', \r
+'dalesearch','<a href="http://www.dalesearch.com/" rel="nofollow" title="Dale Search [new window]" target="_blank">Dale Search</a>',\r
+'danielsen','Thor (danielsen.com)', \r
+'daum','daum',\r
+'de_dolphin_com','<a href="http://de.dolphin.com/" rel="nofollow" title="Dolphin Search search page [new window]" target="_blank">Dolphin Search</a>',\r
+'de_wiki_gov_cn','<a href="http://de.wiki.gov.cn/" rel="nofollow" title="Wiki Sucher [new window]" target="_blank">Wiki Sucher</a>',\r
+'dejanews','DejaNews',\r
+'delicious','<a href="http://del.icio.us/" title="del.icio.us home page [new window]" rel="nofollow" target="_blank">del.icio.us</a> (Social Bookmark)',\r
+'delta-search','delta-search',\r
+'digg','<a href="http://www.digg.com/" title="Digg home page [new window]" rel="nofollow" target="_blank">Digg</a> (Social Bookmark)',\r
+'dmoz','<a href="http://dmoz.org/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">DMOZ</a>',\r
+'dodajpl','<a href="http://www.dodaj.pl/" title="Dodaj.pl home page [new window]" rel="nofollow" target="_blank">Dodaj.pl</a>',\r
+'dogpile','<a href="http://www.dogpile.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Dogpile</a>',\r
+'duckduckgo','<a href="http://r.duckduckgo.com/" rel="nofollow" title="DuckDuckGo Home Page [new window]" target="_blank">DuckDuckGo</a>',\r
+'earthlink', 'Earth Link',\r
+'easysearch','<a href="http://heatherjeffery.easysearch.org.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">easysearch</a>',\r
+'ecosia','ecosia',\r
+'edderkoppen','Edderkoppen', \r
+'engine','Cade', \r
+'eniro','<a href="http://www.eniro.no/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Eniro</a>',\r
+'enirose','<a href="http://www.eniro.se/" title="Eniro Sverige home page [new window]" rel="nofollow" target="_blank">Eniro Sverige</a>',\r
+'ereadingsource','ereadingsource',\r
+'etools_ch','<a href="http://www.etools.ch/" rel="nofollow" title="eTools.ch [new window]" target="_blank">eTools.ch</a>',\r
+'euroseek','Euroseek',\r
+'everyclick','everyclick',\r
+'excite','<a href="http://www.excite.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Excite</a>',\r
+'facemoods','facemoods',\r
+'fastbot_de','<a href="http://fastbot.de/" rel="nofollow" title="Fastbot.de [new window]" target="_blank">Fastbot.de (Does not provide search keyphrases; using found page instead)</a>',\r
+'fbdownloader','<a href="http://search.fbdownloader.com/" rel="nofollow" title="FBDownloader Home Page [new window]" target="_blank">FBDownloader (fbdownloader)</a>',\r
+'fdownloadr_com','<a href="http://search.fdownloadr.com/" rel="nofollow" title="FBDownloader Home Page [new window]" target="_blank">FBDownloader (fdownloadr)</a>',\r
+'find1friend','<a href="http://find1friend.com/" rel="nofollow" title="Find1Friend [new window]" target="_blank">Find1Friend</a>',\r
+'findamo','findamo',\r
+'findarticles','Find Articles',\r
+'finddk','Find', \r
+'fireball','fireball',\r
+'flipora','<a href="http://static.flipora.com/" rel="nofollow" title="Flipora Home Page [new window]" target="_blank">Flipora</a>',\r
+'foxstart','foxstart',\r
+'fr_search_yahoo_com','<a href="http://fr.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo fr.search.yahoo.com</a>',\r
+'francite','Francite', \r
+'free', 'Free.fr', \r
+'freenet_de','<a href="http://suche.freenet.de/" rel="nofollow" title="suche.freenet.de [new window]" target="_blank">suche.freenet.de</a>',\r
+'freeserve','Freeserve', \r
+'funmoods','funmoods',\r
+'gazetapl','<a href="http://szukaj.gazeta.pl/" title="Gazeta.pl home page [new window]" rel="nofollow" target="_blank">Gazeta.pl</a>',\r
+'genieo','<a href="http://search.genieo.com/" rel="nofollow" title="Genieo home page [new window]" target="_blank">Genieo</a>',\r
+'gerypl','<a href="http://szukaj.gery.pl/" title="Gery.pl home page [new window]" rel="nofollow" target="_blank">Gery.pl</a>',\r
+'globososo','Globososo',\r
+'gmxsuche','<a href="http://suche.gmx.net/" rel="nofollow" title="GMX Suche Home Page [new window]" target="_blank">GMX Suche</a>',\r
+'gmxsuche_at','<a href="http://suche.gmx.at/" rel="nofollow" title="GMX Suche Oesterreich Home Page [new window]" target="_blank">GMX Suche Oesterreich</a>',\r
+'go','Go.com',\r
+'go.mail.ru','go.mail.ru',\r
+'go2net','Go2Net (Metamoteur)',\r
+'godado','Godado.it',\r
+'goliat','Goliat', \r
+'goodsearch','<a href="http://www.goodsearch.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">GoodSearch</a>',\r
+'gotuneed','<a href="http://www.gotuneed.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">got u need</a>',\r
+'govome','<a href="http://www.govome.com/" rel="nofollow" title="Govome [new window]" target="_blank">Govome</a>',\r
+'haku','Ihmemaa',\r
+'handycafe','handycafe',\r
+'heureka','Heureka', \r
+'hogapl','<a href="http://www.hoga.pl/" title="Hoga.pl home page [new window]" rel="nofollow" target="_blank">Hoga.pl</a>',\r
+'holasearch','<a href="http://www.holasearch.com" rel="nofollow" title="Hola Search Home Page [new window]" target="_blank">Hola Search</a>',\r
+'hotbot','Hotbot',\r
+'hp_my_aol','hp my aol',\r
+'hubwe','hubwe',\r
+'iask','<a href="http://www.iask.com/" rel="nofollow" target="_blank">Iask</a>',\r
+'iboats','<a href="http://forums.iboats.com/" title="forum home page [new window]" rel="nofollow" target="_blank">Iboats</a>',\r
+'icerocket','<a href="http://www.icerocket.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Icerocket (Blog)</a>',\r
+'ichiro','<a href="http://search.goo.ne.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ichiro</a>',\r
+'icq','<a href="http://www.icq.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">icq</a>',\r
+'ilse','Ilse',\r
+'image_search_yahoo_co_jp','<a href="http://image.search.yahoo.co.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo image.search.yahoo.co.jp</a>',\r
+'images_search_yahoo_com','<a href="http://images.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo images.search.yahoo.com</a>',\r
+'iminent','<a href="http://start.iminent.com/" rel="nofollow" title="Iminent Home Page [new window]" target="_blank">Iminent</a>',\r
+'inbox','inbox',\r
+'incredibar','incredibar',\r
+'incredimail','incredimail',\r
+'indexhu','Index', \r
+'ineffabile','<a href="http://www.ineffabile.it/" title="Ineffabile.it home page [new window]" rel="nofollow" target="_blank">Ineffabile.it</a> (Social Bookmark)',\r
+'infoseek','Infoseek',\r
+'infospace','InfoSpace',\r
+'infouk','<a href="http://info.co.uk/" title="home page [new window]" rel="nofollow" target="_blank">Info UK</a>',\r
+'inspsearch','<a href="http://airzip.inspsearch.com/" rel="nofollow" title="airzip.inspsearch.com [new window]" target="_blank">airzip.inspsearch.com</a>',\r
+'int_search_myway_com','<a href="http://int.search.myway.com/" rel="nofollow" title="MyWay search page [new window]" target="_blank">MyWay</a>',\r
+'interiapl','<a href="http://www.google.interia.pl/" title="Interia.pl home page [new window]" rel="nofollow" target="_blank">Interia.pl</a>',\r
+'internetto','Internetto Kereso',\r
+'isearch_nation_com','<a href="http://isearch.nation.com/" rel="nofollow" title="Nation Search [new window]" target="_blank">Nation Search</a>',\r
+'it_search_yahoo_com','<a href="http://it.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo it.search.yahoo.com</a>',\r
+'iune','<a href="http://www.i-une.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">i-une</a>',\r
+'ixquick','<a href="http://www.ixquick.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">ix quick</a>', \r
+'izito_catchall','izito ( catchall )', \r
+'izito_de','<a href="http://www.izito.de/" rel="nofollow" title="iZito Deutschland [new window]" target="_blank">izito .de</a>', \r
+'izito_uk','<a href="http://www.izito.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">izito .uk</a>', \r
+'jubii','Jubii', \r
+'jumpyit','Jumpy.it',\r
+'juno','<a href="http://search.juno.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">juno</a>', \r
+'jyxo','Jyxo.cz', \r
+'kartoo','<a href="http://www.kartoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Kartoo</a>',\r
+'katalogonetpl','<a href="http://katalog.onet.pl/" title="Katalog.Onet.pl home page [new window]" rel="nofollow" target="_blank">Katalog.Onet.pl</a>',\r
+'kataweb','<a href="http://www.kataweb.it/ricerca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Kataweb</a>',\r
+'keresolap_hu','<a href="http://keresolap.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Tango keresolap</a>',\r
+'kvasir','kvasir',\r
+'kvitters','kvitters',\r
+'lapkereso_hu','Startlapkereso', \r
+'lbb','LBB', \r
+'ledix','<a href="http://www.ledix.net/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Ledix</a>',\r
+'libero','<a href="http://www.libero.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Libero IT</a>',\r
+'libertysurf', 'Libertysurf', \r
+'live','<a href="http://www.live.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Microsoft Windows Live</a>',\r
+'localmoxie','<a href="http://www.localmoxie.com/" rel="nofollow" title="Local Moxie [new window]" target="_blank">Local Moxie</a>',\r
+'looksmart_catchall','looksmart ( catchall )',\r
+'looksmart_co_uk','looksmart .co.uk',\r
+'lycos','<a href="http://www.lycos.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Lycos</a>',\r
+'mamma','Mamma',\r
+'meinestadt','meinestadt.de', \r
+'metabot', 'MetaBot',\r
+'metacrawler','metacrawler',\r
+'metacrawler_de','metacrawler.de',\r
+'metager','<a href="http://www.metager.de" rel="nofollow" title="MetaGer Home Page [new window]" target="_blank">MetaGer</a>',\r
+'metahannover','uni-hannover.de',\r
+'metasearch','metasearch',\r
+'metaspinner','metaspinner',\r
+'metasuche_ch','<a href="http://www.metasuche.ch/" rel="nofollow" title="Metasuche search page [new window]" target="_blank">Metasuche.ch</a>',\r
+'metaua','meta.ua',\r
+'miner','Meta Miner',\r
+'mirago','<a href="http://www.mirago.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago (country unknown)</a>',\r
+'miragobe','<a href="http://www.mirago.be/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Belgium</a>',\r
+'miragoch','<a href="http://www.mirago.ch/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Switzerland</a>',\r
+'miragocouk','<a href="http://zone.mirago.co.uk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago UK</a>',\r
+'miragode','<a href="http://www.mirago.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Germany</a>',\r
+'miragodk','<a href="http://www.mirago.dk/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Denmark</a>',\r
+'miragoes','<a href="http://es.mirago.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Spain</a>',\r
+'miragofr','<a href="http://www.mirago.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago France</a>',\r
+'miragoit','<a href="http://www.mirago.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Italy</a>',\r
+'miragonl','<a href="http://www.mirago.nl/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Netherlands</a>',\r
+'miragono','<a href="http://no.mirago.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Norway</a>',\r
+'miragose','<a href="http://www.mirago.se/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mirago Sweden</a>',\r
+'mitrasites','mitrasites',\r
+'mozbot','<a href="http://www.mozbot.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Mozbot</a>',\r
+'msn','<a href="http://search.msn.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Microsoft MSN Search</a>',\r
+'mys_yoursearch_me','<a href="http://mys.yoursearch.me/" rel="nofollow" title="Yoursearch.me search page [new window]" target="_blank">Yoursearch.me</a>',\r
+'mysearch','<a href="http://www.mysearch.com" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">My Search</a>',\r
+'mysearchdial','<a href="http://start.mysearchdial.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">mysearchdial</a>',\r
+'mysearchresults','<a href="http://www.mysearchresults.com" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">mysearchresults</a>',\r
+'myway','<a href="http://search.myway.com" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">myway</a>',\r
+'mywebsearch','<a href="http://search.mywebsearch.com/" title="MyWebSearch home page [new window]" rel="nofollow" target="_blank">MyWebSearch</a>',\r
+'najdi','Najdi.to',\r
+'nation','nation', \r
+'navigationshilfe_t_online','Navigationshilfe T-Online',\r
+'nbci','NBCI',\r
+'netease', '<a href="http://www.163.com/" rel="nofollow" target="_blank">NetEase</a>',\r
+'netluchs','<a href="http://www.netluchs.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Netluchs</a>',\r
+'netscape','<a href="http://www.netscape.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Netscape</a>',\r
+'netsprintpl','<a href="http://www.netsprint.pl/" title="NetSprint.pl home page [new window]" rel="nofollow" target="_blank">NetSprint.pl</a>',\r
+'netstjernen','Netstjernen',\r
+'netzero','<a href="http://search.netzero.net/" title="home page [new window]" rel="nofollow" target="_blank">netzero</a>',\r
+'northernlight','NorthernLight',\r
+'nortonsavesearch','<a href="http://int.search-results.com/" rel="nofollow" title="Norton Safe Search Home Page [new window]" target="_blank">Norton Safe Search</a>',\r
+'nusearch','<a href="http://www.nusearch.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Nusearch</a>',\r
+'o2pl','<a href="http://szukaj2.o2.pl/" title="o2.pl home page [new window]" rel="nofollow" target="_blank">o2.pl</a>',\r
+'ofir','Ofir',\r
+'oneseek_de','<a href="http://www.oneseek.de" rel="nofollow" title="Metasuchmaschine OneSeek.de [new window]" target="_blank">Metasuchmaschine OneSeek.de</a>',\r
+'onetpl','<a href="http://szukaj.onet.pl/" title="Onet.pl home page [new window]" rel="nofollow" target="_blank">Onet.pl</a>',\r
+'opasia','Opasia', \r
+'orange','orange',\r
+'orangeworld','orangeworld',\r
+'orbis','Orbis', \r
+'origo','Origo-Vizsla', \r
+'overture','Overture',\r
+'passagen','Evreka',\r
+'pch','pch',\r
+'peoplecheck_de','<a href="http://peoplecheck.de/" rel="nofollow" title="PeopleCheck.de [new window]" target="_blank">PeopleCheck.de</a>',\r
+'ph_search_yahoo_com','<a href="http://ph.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo ph.search.yahoo.com</a>',\r
+'picsearch','<a href="http://www.picsearch.de/" rel="nofollow" title="picsearch [new window]" target="_blank">picsearch</a>',\r
+'pictures','pictures',\r
+'plusnetwork','<a href="http://www.searchplusnetwork.com/" title="Search Plus Network" rel="nofollow" target="_blank">Search Plus Network</a>',\r
+'pogodak','<a href="http://www.pogodak.com" title="Pogodak search engine home page [new window]" rel="nofollow" target="_blank">Pogodak.com</a>',\r
+'polskapl','<a href="http://szukaj.polska.pl/" title="Polska home page [new window]" rel="nofollow" target="_blank">Polska</a>',\r
+'polymeta_hu','<a href="http://www.polymeta.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Polymeta</a>',\r
+'preciobarato_xyz','<a href="http://preciobarato.xyz/" rel="nofollow" title="preciobarato.xyz offline on Oct 2 2015 [new window]" target="_blank">preciobarato xyz</a>',\r
+'questionanswering','<a href="http://www.questionanswering.com/" title="Questionanswering home page [new window]" rel="nofollow" target="_blank">Questionanswering</a>',\r
+'quick','Quick.cz', \r
+'qwant_com','<a href="https://www.qwant.com/" rel="nofollow" title="qwant.com [new window]" target="_blank">qwant.com</a>',\r
+'r_search_yahoo_com','<a href="http://r.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo r.search.yahoo.com</a>',\r
+'rakuten','<a href="http://websearch.rakuten.co.jp" rel="nofollow" title="websearch.rakuten.co.jp [new window]" target="_blank">websearch.rakuten.co.jp</a>',\r
+'rambler','Rambler',\r
+'redbox','RedBox.cz',\r
+'rr','rr',\r
+'safehomepage_com','<a href="http://searches.safehomepage.com/" rel="nofollow" title="safehomepage.com [new window]" target="_blank">safehomepage.com</a>',\r
+'sagool','<a href="http://sagool.jp/" title="Sagool home page [new window]" rel="nofollow" target="_blank">Sagool</a>',\r
+'sapo','<a href="http://www.sapo.pt/" title="Sapo search engine home page [new window]" rel="nofollow" target="_blank">Sapo</a>',\r
+'schoenerbrausen','<a href="http://www.schoenerbrausen.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Schoenerbrausen/</a>',\r
+'scroogle','<a href="http://www.scroogle.org/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Scroogle</a>',\r
+'se_search_yahoo_com','<a href="http://se.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo se.search.yahoo.com</a>',\r
+'search.com','<a href="http://www.search.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Search.com</a>',\r
+'search_1und1_de','<a href="http://search.1und1.de/" rel="nofollow" title="1&amp;1 Suche [new window]" target="_blank">1&1 Suche (subdomain "search")</a>',\r
+'search_foxtab_com','<a href="http://search.foxtab.com/" rel="nofollow" title="Foxtab Search [new window]" target="_blank">Foxtab Search</a>',\r
+'search_socialdownloadr_com','<a href="http://search.socialdownloadr.com/" rel="nofollow" title="Socialdownloadr search page [new window]" target="_blank">Socialdownloadr</a>',\r
+'search_yahoo_co_jp','<a href="http://search.yahoo.co.jp/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo search.yahoo.co.jp</a>',\r
+'search_yahoo_com','<a href="http://search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo search.yahoo.com</a>',\r
+'search_zonealarm_com','<a href="http://search.zonealarm.com/" rel="nofollow" title="Zone Alarm Search [new window]" target="_blank">Zone Alarm Search</a>',\r
+'searchalgo','searchalgo',\r
+'searchalot','<a href="http://www.searchalot.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Searchalot</a>',\r
+'searchch','search ch',\r
+'searchcompletion','searchcompletion',\r
+'searches_qone8_com','<a href="http://searches.qone8.com/" rel="nofollow" title="Omiga-Plus [new window]" target="_blank">Omiga-Plus</a>',\r
+'searchesnavigator','<a href="http://searchesnavigator.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">searchesnavigator</a>',\r
+'searchfunmoods','<a href="http://sr.searchfunmoods.com/" rel="nofollow" title="Funmoods [new window]" target="_blank">Funmoods</a>',\r
+'searchgol','<a href="http://www.searchgol.com/" rel="nofollow" title="Search-Gol [new window]" target="_blank">Search-Gol</a>',\r
+'searchlistingsite','<a href="http://searchlistingsite.com/" title="home page" rel="nofollow" target="_blank">SearchLlistingSite</a>',\r
+'searchmobileonline','searchmobileonline',\r
+'searchresults','<a href="http://www1.search-results.com/" rel="nofollow" title="Search-results Home Page [new window]" target="_blank">Search-results</a>',\r
+'search-results_mobi','<a href="http://search-results.mobi/" rel="nofollow" title="search-results.mobi [new window]" target="_blank">search-results.mobi</a>',\r
+'searchresultscom','<a href="http://www.search-results.com/" title="search-results" rel="nofollow" target="_blank">search-results.com ( all sites )</a>',\r
+'searchresultsmobi','<a href="http://www.search-results.mobi/" title="search-results" rel="nofollow" target="_blank">search-results.mobi</a>',\r
+'searchsafer','searchsafer',\r
+'searchy','searchy.co.uk',\r
+'searchya','<a href="http://www.searchya.com/" rel="nofollow" title="Searchya [new window]" target="_blank">Searchya</a>',\r
+'segnalo','<a href="http://segnalo.alice.it/" title="Segnalo home page [new window]" rel="nofollow" target="_blank">Segnalo</a> (Social Bookmark)',\r
+'semalt','semalt',\r
+'sensis','<a href="http://www.sensis.com.au/" title="Segnalo home page [new window]" rel="nofollow" target="_blank">Sensis AU</a>',\r
+'seznam','Seznam', \r
+'sg_search_yahoo_com','<a href="http://sg.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo sg.search.yahoo.com</a>',\r
+'sg_yhs4_search_yahoo_com','<a href="http://sg.yhs4.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo sg.yhs4.search.yahoo.com</a>',\r
+'shawca','<a href="http://start.shaw.ca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Shaw.ca</a>',\r
+'shinyseek\.it','Shinyseek.it',\r
+'shoppstop','<a href="http://www.shoppstop.com/" rel="nofollow" title="ShoppStop [new window]" target="_blank">ShoppStop</a>',\r
+'sify','<a href="http://search.sify.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Sify</a>',\r
+'sky','sky',\r
+'smartsuggestor','<a href="http://search.smartsuggestor.com/" title="home page" rel="nofollow" target="_blank">smartsuggestor</a>',\r
+'smde','<a href="http://www.sm.de/" rel="nofollow" title="SM.de - Die SuchMaschine [new window]" target="_blank">SM.de - Die SuchMaschine</a>',\r
+'snapdo','snapdo',\r
+'softonic','softonic',\r
+'sogou','<a href="http://www.sogou.com/" rel="nofollow" target="_blank">SoGou</a>',\r
+'sol','SOL', \r
+'soso','<a href="http://www.soso.com/" rel="nofollow" target="_blank">SoSo</a>',\r
+'speedbit','<a href="http://go.speedbit.com/" rel="nofollow" title="Speedbit [new window]" target="_blank">Speedbit</a>',\r
+'sphere','<a href="http://www.sphere.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Sphere (Blog)</a>',\r
+'splut','Splut', \r
+'spotjockey','Spotjockey', \r
+'spray','Spray',\r
+'start','start.no',\r
+'startlap_hu','<a href="http://kereso.startlap.hu/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Startlab Kereso</a>',\r
+'startpage','startpage.com',\r
+'startsiden','startsiden',\r
+'startxxl','<a href="http://www.startxxl.com/" rel="nofollow" title="StartXXL Home Page [new window]" target="_blank">StartXXL</a>',\r
+'steadysearch','<a href="http://www.avantfind.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Avantfind</a>',\r
+'stumbleupon','<a href="http://www.stumbleupon.com/" title="Stumbleupon home page [new window]" rel="nofollow" target="_blank">Stumbleupon</a> (Social Bookmark)',\r
+'sucheaolde','<a href="http://sucheaol.aol.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">SucheAOL .de</a>',\r
+'sumaja','<a href="http://www.sumaja.de/" rel="nofollow" title="Sumaja [new window]" target="_blank">Sumaja</a>',\r
+'supereva','<a href="http://search.supereva.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Supereva</a>',\r
+'surfcanyon_com','<a href="http://search.surfcanyon.com/" rel="nofollow" title="SurfCanyon [new window]" target="_blank">SurfCanyon</a>',\r
+'sweetim','sweetim',\r
+'sweetpacks','<a href="http://www.sweetpacks-search.com/" rel="nofollow" title="Sweetpacks [new window]" target="_blank">Sweetpacks</a>',\r
+'swik','<a href="http://swik.net/" title="Swik home page [new window]" rel="nofollow" target="_blank">Swik</a> (Social Bookmark)',\r
+'swisscows_ch','<a href="https://swisscows.ch/" rel="nofollow" title="Swisscows search page [new window]" target="_blank">Swisscows</a>',\r
+'sympatico','<a href="http://sympatico.msn.ca/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Sympatico</a>',\r
+'szukaczpl','<a href="http://www.szukacz.pl/" title="Szukacz home page [new window]" rel="nofollow" target="_blank">Szukacz</a>',\r
+'t_online_catchall','T-Online ( catchall )',\r
+'t_online_de','T-Online .de',\r
+'talktalk_uk','talktalk uk',\r
+'tango_hu','<a href="http://tango.hu/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Tango</a>',\r
+'tbask','tb.ask ?',\r
+'teecnoit','<a href="http://www.teecno.it/" title="Teecno home page [new window]" rel="nofollow" target="_blank">Teecno</a>',\r
+'teoma','<a href="http://search.ask.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Teoma</a>',\r
+'terra','<a href="http://www.terra.es/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Terra</a>',\r
+'tesco','tesco',\r
+'theallsearches','<a href="http://theallsearches.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">theallsearches</a>',\r
+'three','three',\r
+'tiscali','<a href="http://search.tiscali.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Tiscali</a>',\r
+'tixuma_de','<a href="http://www.tixuma.de/" rel="nofollow" title="Tixuma Deutschland [new window]" target="_blank">Tixuma Deutschland</a>',\r
+'toile','Toile du Quebec',\r
+'toshiba','toshiba',\r
+'turtle','Turtle',\r
+'tw_images_search_yahoo_com','<a href="http://tw.images.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo tw.images.search.yahoo.com</a>',\r
+'tyfon','Tyfon', \r
+'uk_foxstart_com','<a href="http://uk.foxstart.com/" rel="nofollow" title="Foxstart search page [new window]" target="_blank">Foxstart.com</a>',\r
+'uk_search_yahoo_com','<a href="http://uk.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo uk.search.yahoo.com</a>',\r
+'uk_yhs4_search_yahoo_com','<a href="http://uk.yhs4.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo uk.yhs4.search.yahoo.com</a>',\r
+'ukdirectory','UK Directory', \r
+'ukindex','UKIndex', \r
+'ukplus','UK Plus', \r
+'umfis','<a href="http://www.umfis.de/" rel="nofollow" title="UMFIS-Online Das Umweltfirmen-Informationssystem der IHKs in Deutschland [new window]" target="_blank">UMFIS-Online Das Umweltfirmen-Informationssystem der IHKs in Deutschland</a>',\r
+'umuwa_de','<a href="http://umuwa.de/" rel="nofollow" title="Umuwa Deutschland [new window]" target="_blank">Umuwa Deutschland</a>',\r
+'us_search_yahoo_com','<a href="http://us.search.yahoo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Yahoo us.search.yahoo.com</a>',\r
+'vindex','Vindex',\r
+'virgilio','<a href="http://www.virgilio.it/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Virgilio</a>',\r
+'virginmedia','virginmedia',\r
+'vi-view_com','<a href="http://searches.vi-view.com/" rel="nofollow" title="vi-view.com [new window]" target="_blank">vi-view.com</a>',\r
+'vivisimo','<a href="http://www.vivisimo.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Vivisimo</a>',\r
+'vlips_de','vlips .de',\r
+'vnet','<a href="http://114.vnet.cn/" rel="nofollow" target="_blank">VNet</a>',\r
+'voila','<a href="http://www.voila.fr/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">Voila</a>',\r
+'wahoo','Wahoo', \r
+'webalta','<a href="http://www.webalta.ru/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">webalta.ru</a>',\r
+'webcrawler','<a href="http://www.webcrawler.com/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">WebCrawler</a>',\r
+'webde','Web.de',\r
+'webmania','webmania.hu', \r
+'whorush_com','whorush com',\r
+'windowssearch_com','<a href="http://www.windowssearch.com/search?q=AWStats" rel="nofollow" title="Example page [new window]" target="_blank">windowssearch.com</a>',\r
+'wisenut','WISENut', \r
+'wow_utop_it','<a href="http://wow.utop.it/" rel="nofollow" title="wow.utop.it [new window]" target="_blank">wow.utop.it</a>',\r
+'wowpl','<a href="http://szukaj.wow.pl/" title="Wow.pl home page [new window]" rel="nofollow" target="_blank">Wow.pl</a>',\r
+'wowsearch','<a href="http://de.wow.com/" rel="nofollow" title="Wow Search Home Page [new window]" target="_blank">Wow Search</a>',\r
+'wowuk','<a href="http://uk.wow.com/" title="uk.Wow home page [new window]" rel="nofollow" target="_blank">uk.wow.com</a>',\r
+'wp','<a href="http://szukaj.wp.pl/" title="Wirtualna Polska home page [new window]" rel="nofollow" target="_blank">Wirtualna Polska</a>',\r
+'www_buenosearch_com','<a href="http://www.buenosearch.com/" rel="nofollow" title="BuenoSearch [new window]" target="_blank">BuenoSearch</a>',\r
+'www_dregol_com','<a href="http://www.dregol.com/" rel="nofollow" title="Dregol Search [new window]" target="_blank">Dregol Search</a>',\r
+'www_wow_com','<a href="http://www.wow.com/" rel="nofollow" title="www.wow.com [new window]" target="_blank">WOW.com</a>',\r
+'wwweasel','<a href="http://wwweasel.de/" title="Search Engine Home Page [new window]" rel="nofollow" target="_blank">WWWeasel</a>',\r
+'yahoo_catchall','yahoo ( catchall )',\r
+'yahoo_mindset','<a href="http://mindset.research.yahoo.com/" rel="nofollow" title="Search Engine Home Page [new window]" target="_blank">Yahoo! Mindset</a>',\r
+'yandex','yandex ( catchall )',\r
+'yandexcom','yandex .com',\r
+'yandexcomtr','yandex .com.tr',\r
+'yandexkz','yandex .kz',\r
+'yandexru','yandex .ru',\r
+'yandexua','yandex .ua',\r
+'yell','<a href="http://www.yell.com/" title="Yell Home Page [new window]" rel="nofollow" target="_blank">Yell</a>',\r
+'yourbestsearch','<a href="http://yourbestsearch.net/" title="Home Page [new window]" rel="nofollow" target="_blank">YourBest Search</a>',\r
+'youtube','youtube',\r
+'zapmeta_catchall','zapmeta ( catchall )',\r
+'zapmeta_ch','zapmeta ch',\r
+'zapmeta_com','zapmeta com',\r
+'zapmeta_de','zapmeta de',\r
+'zhongsou','<a href="http://www.zhongsou.com/" rel="nofollow" target="_blank">ZhongSou</a>',\r
+'zoeken','<a href="http://www.zoeken.nl/" rel="nofollow" target="_blank">Zoeken</a>',\r
+'zoznam','<a href="http://www.zoznam.sk/" title="Zoznam search engine home page [new window]" rel="nofollow" target="_blank">Zoznam</a>',\r
+\r
+# Generic search engines\r
+'search','Unknown search engines'\r
+);\r
+\r
+# Sanity check.\r
+# Uncomment this code and run "perl search_engines.pm" to check that the file entries are consistent.\r
+#-----------------------------------------------------------------------------\r
+#foreach my $key (@SearchEnginesSearchIDOrder_list1) {\r
+#      if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_list1 with no value in SearchEnginesHashID");\r
+#      foreach my $key2 (@SearchEnginesSearchIDOrder_list2) { if ($key2 eq $key) { error("$key is in 1 and 2\n"); } }\r
+#      foreach my $key2 (@SearchEnginesSearchIDOrder_listgen) { if ($key2 eq $key) { error("$key is in 1 and gen\n"); } }\r
+#} }\r
+#foreach my $key (@SearchEnginesSearchIDOrder_list2) {\r
+#      if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_list2 with no value in SearchEnginesHashID");\r
+#      foreach my $key2 (@SearchEnginesSearchIDOrder_list1) { if ($key2 eq $key) { error("$key is in 2 and 1\n"); } }\r
+#      foreach my $key2 (@SearchEnginesSearchIDOrder_listgen) { if ($key2 eq $key) { error("$key is in 2 and gen\n"); } }\r
+#} }\r
+#foreach my $key (@SearchEnginesSearchIDOrder_listgen) { if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in SearchEnginesSearchIDOrder_listgen with no value in SearchEnginesHashID"); } }\r
+#foreach my $key (keys %NotSearchEnginesKeys) { if (! $SearchEnginesHashID{$key}) { error("Entry '$key' has been found in NotSearchEnginesKeys with no value in SearchEnginesHashID"); } }\r
+#foreach my $key (keys %SearchEnginesKnownUrl) {\r
+#      my $found=0;\r
+#      foreach my $key2 (values %SearchEnginesHashID) {\r
+#              if ($key eq $key2) { $found=1; last; }\r
+#      }\r
+#      if (! $found) { die "Entry '$key' has been found in SearchEnginesKnownUrl with no value in SearchEnginesHashID"; }\r
+#}\r
+#foreach my $key (keys %SearchEnginesHashLib) {\r
+#      my $found=0;\r
+#      foreach my $key2 (values %SearchEnginesHashID) {\r
+#              if ($key eq $key2) { $found=1; last; }\r
+#      }\r
+#      if (! $found) { die "Entry '$key' has been found in SearchEnginesHashLib with no value in SearchEnginesHashID"; }\r
+#}\r
+#print @SearchEnginesSearchIDOrder_list1." ".@SearchEnginesSearchIDOrder_list2." ".@SearchEnginesSearchIDOrder_listgen;\r
+\r
+1;\r