Web crawler (bot) detection
[ "panscient", "larbin", "dummy", "Teoma", "alexa",
"froogle", "inktomi", "looksmart", "URL_Spider_SQL",
"Firefly", "NationalDirectory", "Ask Jeeves", "TECNOSEEK",
"InfoSeek", "WebFindBot", "crawler", "girafobot", "Scooter",
"Baidu", "bot", "Google", "SiteUptime", "Slurp",
"WordPress", "ZIBB", "ZyBorg", "msnbot", "check_http",
"libwww-perl", "lwp-trivial", "wget", "curl", "SimplePie",
"Python", "Feed", "HTTPClient", "Tumblr", "Spider", "sanszbot"]
end
Full source at http://pastie.org/191922










2 Comments