Skip to content

Commit

Permalink
change robots regex
Browse files Browse the repository at this point in the history
  • Loading branch information
sebastiank committed Oct 4, 2018
1 parent c3b1b46 commit c1f05c4
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
4 changes: 2 additions & 2 deletions composer.json
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
{
"name": "phantazm/robotdetector",
"name": "workana/robotdetector",
"description": "Detect robots and crawlers.",
"keywords": ["crawler", "spider", "robots", "user_agent"],
"homepage": "https://github.com/Phantazm/RobotDetector",
"homepage": "https://github.com/Workana/RobotDetector",
"license": "MIT",
"authors": [
{
Expand Down
2 changes: 1 addition & 1 deletion src/RobotDetector/RobotDetector.php
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,7 @@ function RobotDetect($user_agent)
$agent = strstr($user_agent, '/', TRUE);

// Robots
$robots = "abcdatos|acme-spider|ahoythehomepagefinder|Alkaline|anthill|appie|arachnophilia|arale|araneo|araybot|architext|aretha|ariadne|arks|aspider|atn|atomz|auresys|backrub|bayspider|bbot|bigbrother|bingbot|bjaaland|blackwidow|blindekuh|Bloodhound|borg-bot|boxseabot|brightnet|bspider|cactvschemistryspider|calif|cassandra|cgireader|checkbot|christcrawler|churl|cienciaficcion|cmc|Collective|combine|confuzzledbot|coolbot|core|cosmos|cruiser|cusco|cyberspyder|cydralspider|desertrealm|deweb|dienstspider|digger|diibot|directhit|dnabot|download_express|dragonbot|dwcp|e-collector|ebiness|eit|elfinbot|emacs|emcspider|esculapio|esther|evliyacelebi|nzexplorer|fastcrawler|fdse|felix|ferret|fetchrover|fido|finnish|fireball|fish|fouineur|francoroute|freecrawl|funnelweb|gama|gazz|gcreep|getbot|geturl|golem|googlebot|grapnel|griffon|gromit|gulliver|gulperbot|hambot|harvest|havindex|hi|hometown|wired-digital|htdig|htmlgobble|hyperdecontextualizer|iajabot|ibm|iconoclast|Ilse|imagelock|incywincy|informant|infoseek|infoseeksidewinder|infospider|inspectorwww|intelliagent|irobot|iron33|israelisearch|javabee|JBot|jcrawler|askjeeves|jobo|jobot|joebot|jubii|jumpstation|kapsi|katipo|kdd|kilroy|ko_yappo_robot|larbin|legs|linkidator|linkscan|linkwalker|lockon|lycos|macworm|magpie|marvin|mattie|mediafox|merzscope|meshexplorer|MindCrawler|mnogosearch|moget|momspider|monster|motor|msnbot|muncher|muninn|muscatferret|mwdsearch|myweb|NDSpider|netcarta|netmechanic|netscoop|newscan-online|nhse|nomad|northstar|objectssearch|occam|octopus|OntoSpider|openfind|orb_search|packrat|pageboy|parasite|patric|pegasus|perignator|perlcrawler|phantom|phpdig|piltdownman|pimptrain|pioneer|pitkow|pjspider|pka|plumtreewebaccessor|poppi|portalb|psbot|Puu|python|raven|rbse|resumerobot|rhcs|rixbot|roadrunner|robbie|robi|robocrawl|robofox|robozilla|roverbot|rules|safetynetrobot|scooter|search_au|search-info|searchprocess|senrigan|sgscout|shaggy|shaihulud|sift|simbot|site-valet|sitetech|skymob|slcrawler|slurp|smartspider|snooper|solbot|speedy|spider_monkey|spiderbot|spiderline|spiderman|spiderview|spry|ssearcher|suke|suntek|sven|sygol|tach_bw|tarantula|tarspider|tcl|techbot|templeton|titin|titan|tkwww|tlspider|ucsd|udmsearch|uptimebot|urlck|us|valkyrie|verticrawl|victoria|visionsearch|voidbot|voyager|vwbot|w3index|w3m2|wallpaper|wanderer|wapspider|webbandit|webcatcher|webcopy|webfetcher|webfoot|webinator|weblayers|weblinker|webmirror|webmoose|webquest|webreader|webreaper|webs|websnarf|webspider|webvac|webwalk|webwalker|webwatch|wget|whatuseek|whowhere|wlm|wmir|wolp|wombat|worm|wwwc|wz101|xget|Nederland.zoek|nutch";
$robots = "abcdatos|spider|ahoythehomepagefinder|Alkaline|anthill|appie|arachnophilia|arale|araneo|araybot|architext|aretha|ariadne|arks|atn|atomz|auresys|backrub|bbot|bigbrother|bingbot|bjaaland|blackwidow|blindekuh|Bloodhound|borg-bot|boxseabot|brightnet|calif|cassandra|cgireader|checkbot|crawl|churl|cienciaficcion|cmc|Collective|combine|confuzzledbot|coolbot|core|cosmos|cruiser|cusco|cyberspyder|desertrealm|deweb|digger|diibot|directhit|dnabot|download_express|dragonbot|dwcp|e-collector|ebiness|eit|elfinbot|emacs|esculapio|esther|evliyacelebi|nzexplorer|fdse|felix|ferret|fetchrover|fido|finnish|fireball|fish|fouineur|francoroute|funnelweb|gama|gazz|gcreep|getbot|geturl|golem|googlebot|grapnel|griffon|gromit|gulliver|gulperbot|hambot|harvest|havindex|hi|hometown|wired-digital|htdig|htmlgobble|hyperdecontextualizer|iajabot|ibm|iconoclast|Ilse|imagelock|incywincy|informant|infoseek|infoseeksidewinder|inspectorwww|intelliagent|irobot|iron33|israelisearch|javabee|JBot|askjeeves|jobo|jobot|joebot|jubii|jumpstation|kapsi|katipo|kdd|kilroy|ko_yappo_robot|larbin|legs|linkidator|linkscan|linkwalker|lockon|lycos|magpie|marvin|mattie|mediafox|merzscope|meshexplorer|mnogosearch|moget|monster|motor|msnbot|muncher|muninn|muscatferret|mwdsearch|myweb|netcarta|netmechanic|netscoop|newscan-online|nhse|nomad|northstar|objectssearch|occam|octopus|openfind|orb_search|packrat|pageboy|parasite|patric|pegasus|perignator|phantom|phpdig|piltdownman|pimptrain|pioneer|pitkow|pka|plumtreewebaccessor|poppi|portalb|psbot|Puu|python|raven|rbse|resumerobot|rhcs|rixbot|roadrunner|robbie|robi|robofox|robozilla|roverbot|rules|safetynetrobot|scooter|search_au|search-info|searchprocess|senrigan|sgscout|shaggy|shaihulud|sift|simbot|site-valet|sitetech|skymob|slurp|snooper|solbot|speedy|spry|ssearcher|suke|suntek|sven|sygol|tach_bw|tarantula|tcl|techbot|templeton|titin|titan|tkwww|ucsd|udmsearch|uptimebot|urlck|us|valkyrie|victoria|visionsearch|voidbot|voyager|vwbot|w3index|w3m2|wallpaper|wanderer|webbandit|webcatcher|webcopy|webfetcher|webfoot|webinator|weblayers|weblinker|webmirror|webmoose|webquest|webreader|webreaper|webs|websnarf|webvac|webwalk|webwalker|webwatch|wget|whatuseek|whowhere|wlm|wmir|wolp|wombat|worm|wwwc|wz101|xget|Nederland.zoek|nutch|yandex|ahrefs|semrush|dotbot|trovitbot";

// Quick check if robot
$isRobot = (stripos($robots, $agent) === FALSE) ? 0 : 1;
Expand Down

0 comments on commit c1f05c4

Please sign in to comment.