# wtop.cfg
[main]
# Comma-separated list of output field names.
# NOTE(review): presumably the fields shown when none are requested explicitly -- confirm against the tool.
DEFAULT_OUTPUT_FIELDS=ts,class,ip,msec,uas,url,refdom
# Log dialect to parse: "apache" here; "iis" is used by the experimental block at the end of this section.
LOG_FILE_TYPE=apache
# This MUST match your Apache LogFormat directive.
# To use wtop, you MUST have at least %s, %r, %t and %D.
# In Apache's mod_log_config: %s = status (%>s = final status), %r = first line of
# the request, %t = time the request was received, %D = time taken to serve the
# request, in microseconds.
LOG_FORMAT=%h %l %u %t "%r" %>s %B "%{Referer}i" "%{User-Agent}i" %D
# Directory holding the log files, and the name of the log file to read.
# NOTE(review): presumably combined as LOG_ROOT + LOG_FILE, so keep the trailing slash -- confirm.
LOG_ROOT=/var/log/apache2/
LOG_FILE=access_log
## uncomment these lines for limited, experimental Microsoft IIS support
## (they replace the LOG_FILE_TYPE, LOG_FORMAT and LOG_ROOT values set above)
# LOG_FILE_TYPE=iis
# LOG_FORMAT=w3c-extended
# LOG_ROOT=C:\Windows\System32\logfiles\W3SVC1\
[wtop]
# max time before a request is logged in the "slow" column
# NOTE(review): the unit is not stated in this file; presumably milliseconds
# (cf. the "msec" output field) -- confirm.
MAX_REQUEST_TIME=5000
# minimum requests/second before a URL class appears in top mode
MIN_RPS=0.2
[classes]
# you can define any classes you wish with regular expressions
# Each entry has the form name=pattern. Commented-out examples:
#foo=/some/.+/bar
#baz=/some/other/path
#affiliate=MY_AFFILIATE_ID
# home: exactly the root path "/", optionally followed by a query string.
home=^/(?:\?.*)?$
# static (disabled): one combined class for the file extensions that are split
# into separate classes below, plus "txt".
#static=\.(?:png|gif|jpe?g|cur|ico|bmp|xml|txt|js|css|swf)(?:\?.*)?$
# Per-type classes: the URL ends with the given extension, optionally followed
# by a query string.
xml=\.xml(?:\?.*)?$
js=\.js(?:\?.*)?$
css=\.css(?:\?.*)?$
swf=\.swf(?:\?.*)?$
img=\.(?:png|gif|jpe?g|cur|ico|bmp)(?:\?.*)?$
[patterns]
# the generic class pattern is used if a URL does not match any
# of the named classes above.
# It captures the top-level directory: the first path segment after the
# leading "/", up to the next "/" or "?".
# This note is kept on its own line on purpose: INI parsers that do not support
# inline comments would treat trailing "# ..." text as part of the regex.
generic=^/([^/\?]+)
## user-agent pattern for identifying robots (optimized)
## One large alternation of known crawler/bot User-Agent fragments, grouped by
## shared prefixes. Keep the whole value on a single physical line: a line break
## inside it ends the value and the remainder is no longer part of the pattern.
## NOTE(review): the prefix grouping and escaping look machine-generated; prefer
## regenerating over hand-editing -- confirm with the maintainers.
robots=(?:00(?:7AC9|8\/0\.(?:71|8[35]))|192\.comAgent|200PleaseBot|360Spider|4seohuntBot|50\.nu|A(?:6\-Indexer|DmantX\ Platform\ Semantic\ Analyzer|MZNKAssocBot|SAHA\ Search\ Engine\ Turkey|b(?:ou(?:ndexbot|tUsBot)|rave\ Spider)|c(?:c(?:elobot|oona\-AI\-Agent)|o(?:onBot|rn))|d(?:dThis\.com|sBot\-Google)|hrefsBot|l(?:exabot|maden)|m(?:agit\.COM|fibibot)|ntBot|p(?:ercite|ortWorm)|ra(?:Bot|chnophilia)|sk(?:\ Jeeves\/Teoma|Quickly)|utomattic\ Analytics\ Crawler)|B(?:D(?:Cbot|Fetch)|LEXBot|UbiNG|a(?:balooSpider|cklinkCrawler|d\-Neighborhood|iduspider)|e(?:comeBot|gunAdvertising)|igsearch\.ca|l(?:aiz\-Bee|ekkobot|inkaCrawler|og(?:Pulse|gsi))|otOnParade|r(?:ainbruBot|owsershots)|u(?:tterfly|zzRankingBot))|C(?:C(?:Bot|ResearchBot)|JB\.NET\ Proxy|MS\ Crawler|OMODOSpider|a(?:montSpider|reerBot|stabot|tchBot|zoodleBot)|ha(?:ngeDetection|rlotte)|i(?:rrusExplorer|ty4you)|l(?:i(?:gooRobot|qz(?:Bot|bot))|oud(?:Flare\-AlwaysOnline|ServerMarketSpider))|o(?:m(?:bine|p(?:SpyBot|any\ News\ Search\ engine))|nveraCrawler|rpusCrawler|vario\-IDS)|r(?:a(?:wler4j|zyWebCrawler\-Spider)|owsnest)|urious\ George)|D(?:BLBot|CPbot|KIMRepBot|NS\-Digger\-Explorer|a(?:ta(?:Fountains|parkSearch)|umoa)|e(?:alGates\ Bot|pSpid)|o(?:mainDB|t(?:\ TK\ \-\ spider|Bot))|ripfeedBot|uckDuck(?:Bot|Preview))|E(?:DI\/1\.6\.[56]|as(?:ouSpider|yBib\ AutoCite)|disterBot|mbedly|n(?:aBot|terprise\_Search)|sribot|ur(?:ipBot|obot)|v(?:e(?:ntGuruBot|ryoneSocialBot)|riNid)|x(?:B\ Language\ Crawler|a(?:bot|ctSEEK))|zooms)|F(?:AST\ (?:Enterprise\ Crawler|MetaWeb\ Crawler)|a(?:cebookExternalHit|irShare|lconsbot|uBot)|e(?:ed(?:CatBot|Finder\/bloggz\.se|ly)|tch\-Guess)|indexa\ Crawler|l(?:atland\ Industries\ Web\ Spider|i(?:ghtDeckReportsBot|pboardProxy)|ocke\ bot)|o(?:llowSite\ Bot|oooo\_Web\_Video\_Crawl|rschungsportal)|r(?:ancis|eeWebMonitoring\ SiteChecker)|u(?:nnelBack|rlBot)|yberSpider)|G(?:OFORITBOT|a(?:isbot|llent\ Search\ Spider|rlikCrawler)|e(?:liyooBot|nieo\ Web\ filter|onaBot)|i(?:gabot|ngerCrawler|rafabot)|ooglebot|ra(?:hambot|peshotCrawler)|urujiBot)|H(?:a(?:iloobot|tenaScreenshot)|eartRails\_Capture|iddenMarket|o(?:lmes(?:Bot)?|meTags|oWWWer|stTracker(?:\.com)?)|u(?:aweiSymantecSpider|bSpot\ C(?:onnect|rawler))|ypeStat)|I(?:C(?:C\-Crawler|F\_Site\_Crawler)|RLbot|XEbot|deelaborPlagiaat|framely|l(?:Trovatore(?:\-Setaccio)?|seBot)|mplisenseBot|n(?:f(?:luencebot|o(?:ciousBot|helfer))|te(?:gromeDB|rnetSeer))|pselonbot|stellaBot)|J(?:UST\-CRAWLER|a(?:bse\.com\ Crawler|dynAve(?:Bot)?|mbot)|ikeSpider|ob\ Roboter\ Spider|yxobot)|K(?:Retrieve|a(?:kle\ Bot|looga|rneval\-Bot)|eyw(?:enBot|ordDensityRobot)|o(?:modiaBot|ngulo)|r(?:OWLer|aken|ugle))|L(?:\.webis|a(?:pozzBot|rbin)|e(?:ikibot|murWebCrawler|xxeBot)|i(?:jit|n(?:gu(?:aBot|ee\ Bot)|k(?:\ Valet\ Online|Aider|Walker|edInBot))|pperhey\ Spider)|oad(?:ImpactPageAnalyzer|TimeBot)|uminateBot)|M(?:IA\ Bot|J12bot|LBot|Qbot|S(?:NBot|RBOT)|a(?:hiti\ Crawler|il\.Ru\ bot)|e(?:MoNewsBot|gatext|ta(?:GeneratorCrawler|HeadersBot|JobBot|TagRobot|URI(?:\ API)?|mojiCrawler))|i(?:aDev|xBot)|noGoSearch|o(?:atbot|jeekBot|toricerca\-Robots\.txt\-Checker)|p3Bot|ultiCrawler|yFamilyBot)|N(?:G(?:\-Search|\/2\.0)|LNZ\_IAHarvester2013|PBot|a(?:jdi\.si|lezenCzBot|verBot)|e(?:rd(?:ByNature\.Bot|yBot)|t(?:ResearchServer|WhatCrawler|craftSurveyAgent|intelligence\ LiveAssessment|seer)|xtGenSearchBot)|i(?:gma\.ru|mbleCrawler)|u(?:Search\ Spider|hk|tch)|ymesis)|O(?:celli|mniExplorer\_Bot|n(?:etSzukaj|line\ Domain\ Tools)|oyyoBot|pen(?:\ Web\ Analytics\ Bot|CalaisSemanticProxy|WebSpider|bot|indexSpider)|r(?:biter|gbyBot)|sObot)|P(?:a(?:ge(?:2RSS|BitesHyperBot|Peeker)|nscient\ web\ crawler|perLiBot|rchBot|yPal\ IPN)|e(?:e(?:p(?:lo\ Screenshot\ Bot|owbot)|w)|rcolateCrawler)|i(?:nterest|plBot|xray\-Seeker)|lukkie|o(?:godak\.co\.yu|mpos|stPost)|roCog(?:Bot|SEOBot))|Q(?:irina\ Hurdler|seero|u(?:a(?:lidator\.com\ Bot|ntcastbot)|erySeekerSpider))|R(?:6\ bot|ADaR\-Bot|SSMicro\.com\ RSS\/Atom\ Feed\ Robot|ankurBot|e(?:adability|dBot)|o(?:bo(?:\ Crawler|ts\_Tester|zilla)|nzoobot)|uky\-Roboter|yzeCrawler)|S(?:AI\ Crawler|B(?:Ider|Search)|CFCrawler|EO(?:Dat|ENGBot|kicks\-Robot)|SL(?:\-Crawler|Bot)|TINGbot|WEBot|anszBot|c(?:arlett|o(?:llSpider|oter|utJet)|r(?:apy|eenerBot\ Crawler|ubby))|e(?:arch(?:\ Engine\ World\ Robots\.txt\ Validator|17Bot|metricsBot)|curityResearchBot|m(?:a(?:ger|ntifire)|rushBot)|nsis\ Web\ Crawler|o(?:CheckBot|bility)|toozbot|znamBot)|h(?:areaholicbot|elob|im\-Crawler|o(?:pWiki|wyouBot))|i(?:rketce\/Busiverse|te(?:Condor|domain\-Bot))|kreemRBot|n(?:ap(?:Bot|bot|py)|iffRSS)|o(?:lomonoBot|sospider)|p(?:eedy|i(?:derLing|nn3r)|o(?:ck\ Crawler|keSpider)|roose|utnikBot)|revBot|t(?:a(?:ckRambler|toolsBot)|eeler|rokebot)|ur(?:centroBot|phace\ Scout|veyBot)|y(?:golBot|mfony\ Spider|nooBot)|zuka(?:cz|nkobot))|T(?:agoobot|e(?:chnoratibot|ragramCrawler)|h(?:eophrastus|umb(?:S(?:hots\-Bot|niper)|nail\.CZ\ robot|shots\.ru))|inEye|o(?:mTom\ places\ company\ search|picbot|read\-Crawler|uche)|u(?:rnitinBot|torGigBot)|w(?:engaBot|i(?:celer|kle|ngly\ Recon)))|U(?:ASlinkChecker|RLAppendBot|n(?:isterBot|windFetchor)|p(?:downerbot|time(?:Dog|Robot))|rlfilebot\ \(Urlbot\))|V(?:ERASYS\ 2k|MBot|ORTEX|WBot|agabondo|e(?:dma|rmut|spa\ Crawler)|i(?:deoSurf\_bot|sbot)|oilaBot)|W(?:ASALive\-Bot|BSearchBot|IRE|MCAI\_robot|atchMouse|e(?:SEE|b(?:\-(?:Monitoring|sniffer)|Alta\ Crawler|Co(?:okies|rp)|Images|NL|RankSpider|T(?:arantula\.com\ Crawler|humbnail)|Watch\/Robot\_txtChecker|arooBot|scope\ Crawler))|hoismindbot|i(?:kioFeedBot|ll(?:ow\ Internet\ Crawler|yBot)|n(?:WebBot|kBot))|o(?:ko|rdPress\.com\ mShots|tbox))|X(?:ML\ Sitemaps\ Generator|RL\/3\.00|marksFetch|oviBot)|Y(?:RSpider|YSpider|a(?:anb|hoo\!|n(?:dexBot|ga))|ioopBot|o(?:daoBot|ono\ Bot|udaoBot|wedoBot))|Z(?:ACATEK\_CZ|e(?:erchBot|usbot)|oo(?:ka(?:Bot|bot)|mSpider\ \(ZSEBOT\))|umBot|yBorg)|\^Nail|a(?:bby|dressendeutschland\.de|i(?:HitBot|ppie)|kula|lexa\ site\ audit|mibot|r(?:achnode\.net|chive\.org\_bot))|b(?:a(?:cklink\-check\.de|ypup)|i(?:ngbot|tlybot|wec|xocrawler)|l\.uk\_lddc\_bot|nf\.fr\_bot|o(?:itho\.com\-dc|t(?:\-pge\.chlooe\.com|\.wsowner\.com|mobi))|tbot)|c(?:cubee|ityreview|lassbot|o(?:ccoc|pyright\ sheriff)|rawler\ for\ netopian|sci\_b659|url)|d(?:atagnionbot|el\.icio\.us\-thumbnails|iscoverybot|l(?:cbot|vr\.it)|otSemantic|rupact)|e(?:\-SocietyRobot|C(?:airn\-Grabber|ommerceBot)|gothor|jupiter\.com|mefgebot|nvolk)|f(?:a(?:c(?:ebookplatform|tbot)|stbot\ crawler|vorstarbot)|i(?:ndlinks|rmilybot)|latlandbot)|g(?:2crawler|enieBot|o(?:crawl|nzo)|sa\-crawler)|h(?:awkReader|eritrix|t\:\/\/Dig)|i(?:Cjobs|a(?:\_archiver|nt|skspider)|chiro|dmarch|m(?:bot|mediatenet\ thumbnails))|k(?:sibot|ulturarw)|l(?:i(?:n(?:guatools|k(?:dex(?:\.com|bot)|smanager\_bot))|vedoor\ ScreenShot)|mspider)|m(?:agpie\-crawler|eanpathbot|iniRank|o(?:ba\-crawler|zDex)|usobot)|n(?:avissobot|e(?:kstbot|stReader|tEstate\ Crawler|xtthing\.org)|ner|o(?:destackbot|yona)|worm)|o(?:Bot|mgilibot|w(?:nCloud\ Server\ Crawler|sBot))|p(?:a(?:ge\_verifier|rsijoo)|eerindex|ingdom\.com\_bot|moz\.info\ ODP\ link\ checker|o(?:lixea\.de|sterus)|r(?:\-cy\.ru\ Screenshot\ Bot|oximic)|sbot)|quickobot|r(?:\.it|ogerbot)|s(?:chibstedsokbot|e(?:arch\.KumKie\.com|egnifybot)|i(?:lk|strix)|mart\.apnoti\.com\ Robot|nap\.com|o(?:cialbm\_bot|gou\ spider)|p(?:bot|roose)|tq\_bot|uggybot)|t(?:aptubot|extractor|humbshots\-de\-Bot|rendictionbot)|u(?:MBot|pdated|rlfan\-bot)|v(?:irus\_detector|o(?:id\-bot|ltron|yager))|w(?:e(?:b(?:inatorbot|mastercoffee)|ctar)|get|ikiwix\-bot|oriobot|s(?:Analyzer|check\.com)|ww(?:\.fi\ crawler|ster))|x28\-job\-bot|y(?:acybot|zer))