# List of robot spiders
# Each entry is a pair: first the string to find in the log,
# second the robot's full name.
# Sorted by popularity (faster search)
#
# http://www.user-agents.org/cgi-bin/free-search.cgi?free-search.shtml
#
# NOTE(review): a few match strings appear more than once (Sistrix,
# Cityreview, archive.org_bot, mj12bot/MJ12bot). Presumably the first
# matching entry wins, making the later ones dead - confirm against the
# parser before removing them.
#
# Top robots
"googlebot", "Googlebot"
"msnbot", "Msn"
"slurp", "Yahoo"
"yahoo", "Yahoo"
"bingbot", "Bing"
"mms dash", "Yahoo"
"voila", "Voila"
"natcrawlbloc", "Voila"
"yodaobot", "Yodao"
"cuil", "Cuil"
"exabot", "Exabot"
"baiduspider", "Baidu"
"htdig", "ht://Dig"
"infoseek", "InfoSeek Robot 1.0"
"infoseeksidewinder", "Infoseek Sidewinder"
"fast-webcrawler", "Fast Web Crawler"
"fast enterprise crawler", "FAST Enterprise"
"fast metaWeb crawler", "Fast Search"
"fast crawler", "FAST Web Crawler"
"crawler@fast.no", "FAST Enterprise"
"Jyxobot", "Jyxobot"
"jeeves", "Jeeves"
#
# Frequent robots
"webvac", "WebVac"
"ichiro", "Ichiro"
"StackRambler", "StackRambler"
"speedy", "Speedy Spider"
"surveybot", "Survey Whois"
"harvest", "Harvest"
"antibot", "Antibot"
"seekbot", "Seekbot"
"ia_archiver", "Alexa"
"vsyncrawler", "vsyncrawler"
"sogou", "Sougou spider"
"Accoona-AI-Agent", "Accoona"
"scooter", "Yahoo"
"scoutjet", "ScoutJet"
"ask.com", "Ask.com"
"dotnetdotcom", "dotnetdotcom"
"youdaobot", "Youdao"
"discobot", "Discovery Engine"
"GSLFbot", "Amazon aws"
#
# Seen only once
"MyNutchSpider", "Apache Nutch"
"ExB Language Crawler", "ExB"
"Sistrix", "Sistrix"
"EasouSpider", "EasouSpider"
"AhrefsBot", "Ahrefs"
"Sistrix", "Sistrix"
"Voluniabot", "Volunia"
"Ezooms", "Ezooms"
"Cityreview", "Cityreview"
"nigma", "Nigma"
"Sosospider", "Soso"
"Daumoa", "Daumoa"
"accelobot", "Accelovation"
"Purebot", "Puritysearch"
"SolomonoBot", "Solomono"
"Atraxbot", "Atrax Solutions"
"Cityreview", "Cityreview"
"CatchBot", "CatchBot"
"GingerCrawler", "Gingersoftware"
"Kalooga", "Kalooga"
"Fastsearch", "Fastsearch"
"Yanga", "Yanga"
"AISearchBot", "AISearchBot"
"Twitturly", "Twitturly"
"seedmain", "Spam bot"
"rdfbot", "rdfbot"
"laycat", "aceleo.com"
"PDFBot", "PDF bot"
"turnitinbot", "Turnitin"
"lapozzbot", "Lappoz"
"checkbot", "Checkbot"
"yetibot", "Yeti"
"atomz", "Atomz.com Search Robot"
"atom", "Atom Feed Robot"
"favorstarbot", "Favorstar"
"IsItRunning-Monitoring", "IsItRunning-Monitoring"
"IRLbot", "Internet Research Lab"
"Lsearch", "Lsearch"
"HTTrack", "HTTrack"
"gaisbot", "Gais"
"sharp-info-agent", "Internet Shinchakubin"
"vwbot", "VWbot"
"larbin", "Larbin"
"python", "The Python Robot"
"Robo Crawler", "Softbank Corp"
"voyager", "Voyager"
"giant", "Giant"
"Redbot", "RedBot"
"appie", "Walhello appie"
"kdd", "KDD-Explorer"
"combine", "Combine System"
"phantom", "Phantom"
"lexxe", "Lexxe"
"fdse", "Fluid Dynamics Search Engine robot"
"linkwalker", "LinkWalker"
"calif", "Calif"
"jobot", "Jobot"
"bloodhound", "Bloodhound"
"visbot", "Visvo"
"naverbot", "Naver"
"msrbot", "Microsoft Research Bot"
"cazoodleBot", "Cazoodle"
"becomeBot", "Become"
"becomejpbot", "Become"
"factbot", "Factbites"
"robotgenius", "Robotgenius"
"psbot", "Picsearch"
"snapbot", "Snap"
"seznambot", "Seznam"
"archive.org_bot", "Archive"
"gigabot", "Gigablast"
"botw spider", "Best of the Web"
"nsrbot", "Net Research Server"
"gnoztik bot", "GnoZtiK"
"ultraseek", "Ultraseek"
"snappreviewbot", "SnapPreview"
"socscibot", "Social Sciences"
"holmes", "Morfeo"
"heritrix", "Heritrix"
"mj12bot", "MJ12"
"sygolbot", "Sygol"
"yacybot", "Yacy"
"synoobot", "Synoo"
"webaroobot", "Webaroo"
"mqbot", "MQBot"
"teezirbot", "Teezir"
"sproose", "Sproose"
"pagebiteshyperbot", "Pagebites"
"furlbot", "Furl"
"quantcastbot", "Quantcast"
"lanshanbot", "Lanshan"
"nrsbot", "Loopimprovements"
"netresearchserver", "Loopimprovements"
"nextgensearchbot", "NextGenSearch"
"woriobot", "Worio"
"qihoobot", "Qihoo"
"great-plains-web-spider", "Flatland"
"localcombot", "Localcom"
"girafabot", "Girafa"
"geniebot", "Genie"
"noxtrumbot", "Noxtrum"
"crawler@noxtrum", "Noxtrum"
"digi-rssbot", "DiGi-RSS"
"archive.org_bot", "BNF"
"disco-crawl", "Experimental crawler"
"novosoft", "Novosoft"
"w3crobot", "W3C Unknown robot"
"MJ12bot", "Majestic-12"
"ImageWalker", "ImageWalker"
"Yandex", "Yandex"
#
# Generic catch-all. NOTE(review): presumably this must stay last so the
# more specific strings above are tried first - confirm against the parser.
"bot", "Unknown robot"