Skip to content

Commit b574005

Browse files
authored
Merge pull request #31 from Setono/create-pull-request/patch
Changes by create-pull-request action
2 parents be487de + 7ef3611 commit b574005

File tree

1 file changed

+61
-10
lines changed

1 file changed

+61
-10
lines changed

src/BotDetector/Bots.php

Lines changed: 61 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,8 @@
1010

1111
final class Bots
1212
{
13-
public const REGEX = "#monitoring360bot
13+
public const REGEX = "#WireReaderBot(?:/([\d+.]+))?
14+
|monitoring360bot
1415
|Cloudflare-Healthchecks
1516
|360Spider
1617
|Aboundex
@@ -108,8 +109,10 @@ final class Bots
108109
|Seznam-Zbozi-robot
109110
|Heurekabot-Feed
110111
|ShopAlike
111-
|Adwords-(?:DisplayAds|Express|Instant)|Google\sWeb\sPreview|Google[\s-]Publisher[\s-]Plugin|Google-(?:Ads-Conversions|Ads-Qualify|Adwords|AMPHTML|Assess|Extended|HotelAdsVerifier|InspectionTool|PageRenderer|Read-Aloud|Safety|Shopping-Quality|Site-Verification|speakr|Stale-Content-Probe|Test|Youtube-Links)|(?:AdsBot|APIs|DuplexWeb|Feedfetcher|Mediapartners)-Google(?:-Mobile)?|Google(?:AdSenseInfeed|AssociationService|bot|Other|Prober|Producer)|Google.*/\+/web/snippet
112+
|Googlebot-News
113+
|Adwords-(?:DisplayAds|Express|Instant)|Google\sWeb\sPreview|Google[\s-]Publisher[\s-]Plugin|Google-(?:adstxt|Ads-Conversions|Ads-Qualify|Adwords|AMPHTML|Assess|Extended|HotelAdsVerifier|InspectionTool|Lens|PageRenderer|Read-Aloud|Safety|Shopping-Quality|Site-Verification|Sites-Thumbnails|speakr|Stale-Content-Probe|Test|Youtube-Links)|(?:AdsBot|APIs|DuplexWeb|Feedfetcher|Mediapartners)-Google(?:-Mobile)?|Google(?:AdSenseInfeed|AssociationService|bot|Other|Prober|Producer|Sites)|Google.*/\+/web/snippet
112114
|^Google$
115+
|Google-Area120-PrivacyPolicyFetcher
113116
|heritrix
114117
|HubSpot\s
115118
|vuhuvBot
@@ -182,6 +185,9 @@ final class Bots
182185
|Screaming\sFrog\sSEO\sSpider
183186
|ScreenerBot
184187
|SemrushBot
188+
|SerpReputationManagementAgent/[\d.]+
189+
|SplitSignalBot
190+
|SiteAuditBot/[\d.]+
185191
|SensikaBot
186192
|SEOENG(?:World)?Bot
187193
|SEOkicks-Robot
@@ -216,16 +222,16 @@ final class Bots
216222
|TinEye-bot
217223
|Tiny\sTiny\sRSS
218224
|theoldreader\.com
219-
|Trackable/0.1
225+
|Trackable/0\.1
220226
|trendictionbot
221227
|TurnitinBot
222-
|TweetedTimes\sBot
228+
|TweetedTimes
223229
|TweetmemeBot
224230
|Twingly\sRecon
225231
|Twitterbot
226232
|UniversalFeedParser
227233
|via\ssecureurl\.fwdcdn\.com
228-
|Uptimebot
234+
|Uptime(?:bot)?/[\d.]+
229235
|UptimeRobot
230236
|URLAppendBot
231237
|Vagabondo
@@ -256,7 +262,9 @@ final class Bots
256262
|YahooCacheSystem
257263
|Y!J-BRW
258264
|Y!J-WSC
259-
|Yandex(?:(?:\.Gazeta\s|Accessibility|Mobile|MobileScreenShot|RenderResources|Screenshot|Sprav)?Bot|(?:AdNet|Antivirus|Blogs|Calendar|Catalog|Direct|Favicons|ForDomain|ImageResizer|Images|Market|Media|Metrika|News|OntoDB(?:API)?|Pagechecker|Partner|RCA|SearchShop|(?:News|Site)links|Tracker|Turbo|Verticals|Vertis|Video|Webmaster))|YaDirectFetcher
265+
|Y!J-ASR
266+
|^Y!J
267+
|Yandex(?:(?:\.Gazeta\s|Accessibility|Mobile|MobileScreenShot|RenderResources|Screenshot|Sprav)?Bot|(?:AdNet|Antivirus|Blogs|Calendar|Catalog|Direct|Favicons|ForDomain|ImageResizer|Images|Market|Media|Metrika|News|OntoDB(?:API)?|Pagechecker|Partner|RCA|SearchShop|(?:News|Site)links|Tracker|Turbo|Userproxy|Verticals|Vertis|Video|Webmaster))|YaDirectFetcher
260268
|Yeti|NaverJapan|AdsBot-Naver
261269
|YoudaoBot
262270
|YOURLS\sv[0-9]
@@ -269,7 +277,8 @@ final class Bots
269277
|.*Java.*outbrain
270278
|HubPages.*crawlingpolicy
271279
|Pinterest(?:bot)?/[\d.]+.*www\.pinterest\.com
272-
|Site24x7
280+
|.*Site24x7
281+
|.*\sHLB/[\d.]+
273282
|s~snapchat-proxy
274283
|Snap\sURL\sPreview\sService
275284
|SnapchatAds/[\d.]+
@@ -358,6 +367,7 @@ final class Bots
358367
|datagnionbot
359368
|WhatCMS
360369
|httpx
370+
|.*\.oast\.
361371
|scaninfo@(?:expanseinc|paloaltonetworks)\.com
362372
|HuaweiWebCatBot
363373
|Hatena-Favicon
@@ -453,7 +463,6 @@ final class Bots
453463
|RenovateBot/[\d.]+
454464
|INETDEX-BOT/[\d.]+
455465
|NETZZAPPEN
456-
|SerpReputationManagementAgent/[\d.]+
457466
|panscient\.com
458467
|research@pdrlabs\.net
459468
|Nicecrawler/[\d.]+
@@ -533,6 +542,8 @@ final class Bots
533542
|MBCrawler
534543
|mariadb-mysql-kbs-bot
535544
|GitHubCopilotChat
545+
|^pdrl\.fm
546+
|PodUptime/
536547
|anthropic-ai
537548
|NetpeakCheckerBot/[\d.]+
538549
|SandobaCrawler/[\d.]+
@@ -568,7 +579,47 @@ final class Bots
568579
|ViberUrlDownloader
569580
|^Zeno$
570581
|Barracuda\sSentinel
571-
|nuhk|grub-client|Download\sDemon|SearchExpress|Microsoft\sURL\sControl|borg|altavista|dataminr\.com|tweetedtimes\.com|teoma|oegp|http%20client|htdig|mogimogi|larbin|scrubby|searchsight|semanticdiscovery|snappy|vortex(?!(?:\sBuild|Plus))|zeal(?!ot)|dataparksearch|findlinks|BrowserMob|URL2PNG|ZooShot|GomezA|Google\sSketchUp|Read%20Later|7Siters|centuryb\.o\.t9|InterNaetBoten|EasyBib\sAutoCite|Bidtellect|tomnomnom/meg|cortex|Re-re\sStudio|adreview|AHC/|NameOfAgent|Request-Promise|ALittle\sClient|Hello,?\sworld|wp_is_mobile|0xAbyssalDoesntExist|Anarchy99|daumoa,damoa,daum,daumos,duamoa,duam,duamos|^revolt|nvd0rz|xfa1|Hakai|gbrmss|fuck-your-hp|IDBTE4M\sCODE87|Antoine|Insomania|Hells-Net|b3astmode|Linux\sGnu\s\(cow\)|Test\sCertificate\sInfo|iplabel|Magellan|TheSafex?Internetx?Search|kirkland-signature|^xenu|^ZmEu|^(?:chrome|firefox|Zeus)$
572-
|[a-z0-9_-]*(?:(?<!cu|power[\s_]|m[\s_])bot(?![\s_]TAB|[\s_]?5[0-9]|[\s_]Senior|[\s_]Junior)|analyzer|appengine|archiver|checker|collector|crawl|crawler|fetcher|indexer|monitor|project(?!or)|research|resolver|robots|scraper|security|spider|study|transcoder|uptime|user[\s_]?agent|validator)(?:[^a-z]|$)
582+
|RuxitSynthetic/[\d.]+
583+
|DynatraceSynthetic/[\d.]+
584+
|sitebulb
585+
|Monsidobot/[\d.]+
586+
|AccompanyBot
587+
|Ghost\sInspector
588+
|Cypress/[\d.]+
589+
|Google-Apps-Script
590+
|SiteOne-Crawler/[\d.]+
591+
|Detectify
592+
|DomCopBot
593+
|Paqlebot/[\d.]+
594+
|Wibybot
595+
|Synapse
596+
|OSZKbot/[\d.]+
597+
|ZoomBot
598+
|RavenCrawler/[\d.]+
599+
|KadoBot
600+
|Dubbotbot/[\d.]+
601+
|Swiftbot/[\d.]+
602+
|EyeMonIT
603+
|ThousandEyes
604+
|OmtrBot/[\d.]+
605+
|WebMon/[\d.]+
606+
|AdsTxtCrawlerTP/[\d.]+
607+
|fragFINN
608+
|Clickagy
609+
|kiwitcms-gitops/[\d.]+
610+
|webtru_crawler
611+
|URLSuMaBot
612+
|360JK\syunjiankong
613+
|UCSBNetworkMeasurement
614+
|Plesk\sscreenshot\sbot
615+
|Who\.is
616+
|Probely
617+
|Uptimia(?:/[\d.]+)?
618+
|2GDPR/[\d.]+
619+
|abuse\.xmco\.fr
620+
|CheckHost
621+
|LAC_IAHarvester/[\d.]+
622+
|nuhk|grub-client|Download\sDemon|SearchExpress|Microsoft\sURL\sControl|borg|altavista|dataminr\.com|teoma|oegp|http%20client|htdig|mogimogi|larbin|scrubby|searchsight|semanticdiscovery|snappy|vortex(?!(?:\sBuild|Plus))|zeal(?!ot)|dataparksearch|findlinks|BrowserMob|URL2PNG|ZooShot|GomezA|Google\sSketchUp|Read%20Later|7Siters|centuryb\.o\.t9|InterNaetBoten|EasyBib\sAutoCite|Bidtellect|tomnomnom/meg|cortex|Re-re\sStudio|adreview|AHC/|NameOfAgent|Request-Promise|ALittle\sClient|Hello,?\sworld|wp_is_mobile|0xAbyssalDoesntExist|Anarchy99|^revolt|nvd0rz|xfa1|Hakai|gbrmss|fuck-your-hp|IDBTE4M\sCODE87|Antoine|Insomania|Hells-Net|b3astmode|Linux\sGnu\s\(cow\)|Test\sCertificate\sInfo|iplabel|Magellan|TheSafex?Internetx?Search|Searcherweb|kirkland-signature|LinkChain|survey-security-dot-txt|^xenu|^ZmEu|^(?:chrome|firefox|Zeus)$
623+
|[a-z0-9_-]*(?:(?<!cu|power[\s_]|m[\s_])bot(?![\s_]TAB|[\s_]?5[0-9]|[\s_]Senior|[\s_]Junior)|analyzer|appengine|archiver?|checker|collector|crawl|crawler|fetcher|indexer|inspector|monitor|project(?!or)|(?<!Google\sWap\s)proxy|research|resolver|robots|scanner|scraper|script|searcher|(?<!-)security|spider|study|transcoder|uptime|user[\s_]?agent|validator)(?:[^a-z]|$)
573624
#x";
574625
}

0 commit comments

Comments
 (0)