# robots.txt -- crawler exclusion rules for this site.
#
# Layout: one directive per line, one record per crawler, records separated
# by a blank line. Everything after a '#' is a comment, so a directive must
# never share a line with preceding comment text or it is ignored.
#
# ---------------------------------------------------------------------------
# Reference: access-log records of crawlers requesting /robots.txt.
# Requests up to 2006-09-13 were answered with 404; requests from 2006-09-15
# onward were answered with 200.
# ---------------------------------------------------------------------------
#2006-09-13 04:04:30 GET /robots.txt - - 217.212.224.141 HTTP/1.0 psbot/0.1+(+http://www.picsearch.com/bot.html) - - 404 1814 259 46
#2006-09-13 04:17:13 GET /robots.txt - - 220.130.191.232 HTTP/1.0 Cazoodle/Nutch-0.9-dev+(Cazoodle+Nutch+Crawler;+http://www.cazoodle.com;+mqbot@cazoodle.com) - - 404 1814 188 437
#2006-09-13 04:25:50 GET /robots.txt - - 66.249.65.114 HTTP/1.1 Googlebot-Image/1.0 - - 404 1795 195 140
#2006-09-13 07:17:50 GET /robots.txt - - 68.142.212.218 HTTP/1.0 Yahoo-MMCrawler/3.x+(mms+dash+mmcrawler+dash+support+at+yahoo+dash+inc+dot+com) - - 404 1814 163 1171
#2006-09-13 07:50:10 GET /robots.txt - - 209.167.50.22 HTTP/1.1 LinkWalker ASP.NET_SessionId=exggvq454vh23oavxaecm545 www.seventwentyfour.com/ 404 1795 240 140
#2006-09-13 07:55:10 GET /robots.txt - - 146.133.13.253 HTTP/1.1 FAST+Enterprise+Crawler+6+used+by+Enel+(gdl_app_fi@enel.it) ASP.NET_SessionId=dsliml455oz1isvrglpaxemx - 404 1814 272 250
#2006-09-13 16:07:16 GET /robots.txt - - 38.100.225.9 HTTP/1.0 sproose/0.1+(sproose+bot;+http://www.sproose.com/bot.html;+crawler@sproose.com) - - 404 1814 175 203
#2006-09-13 17:04:27 GET /robots.txt - - 131.175.1.168 HTTP/1.1 swish-e+spider+2.2+http://swish-e.org/ - - 404 1795 195 15
#2006-09-13 19:50:40 GET /robots.txt - - 69.25.71.12 HTTP/1.1 Accoona-AI-Agent/1.1.2+(aicrawler+at+accoonabot+dot+com) - - 404 1814 232 109
#2006-09-13 20:30:04 GET /robots.txt - - 88.33.54.218 HTTP/1.1 NG/2.0 - - 404 0 169 31
#2006-09-13 21:11:35 GET /robots.txt - - 84.9.137.104 HTTP/1.1 Nusearch+Spider+(www.nusearch.com) - - 404 1795 234 46
#2006-09-13 23:54:00 GET /robots.txt - - 38.113.234.181 HTTP/1.0 voyager/1.0 - - 404 1814 155 187
#2006-09-15 01:33:43 GET /robots.txt - - 212.48.8.143 HTTP/1.1 VirgilioBot+(+admin+e-mail+address+:+search@staff.virgilio.it) - - 200 3286 238 31
#2006-09-15 04:57:37 GET /robots.txt - - 210.173.180.161 HTTP/1.1 ichiro/2.0+(http://help.goo.ne.jp/door/crawler.html) - - 200 3286 161
#2006-09-17 00:26:00 GET /robots.txt - - 209.237.238.179 HTTP/1.0 ia_archiver - - 200 3286 120 375
# Exclude xxx from the entire site; installed 2006/09/14 at 5:18 PM
#2006-09-17 06:19:20 GET /robots.txt - - 66.94.232.246 HTTP/1.0 Scooter/3.3 - - 200 0 147 187
#2006-09-17 10:12:27 GET /robots.txt - - 140.123.101.66 HTTP/1.0 Gaisbot/3.0+(robot06@gais.cs.ccu.edu.tw;+http://gais.cs.ccu.edu.tw/robot.php) - - 200 3291 212 1265
#2006-09-17 10:38:21 GET /robots.txt - - 60.28.17.51 HTTP/1.1 Baiduspider+(+http://www.baidu.com/search/spider.htm) - - 200 3286 161 734
#2006-09-17 19:59:05 GET /robots.txt - - 85.18.14.22 HTTP/1.0 NutchCVS/0.8-dev+(Nutch;+http://lucene.apache.org/nutch/bot.html;+nutch-agent@lucene.apache.org) - - 200 3286 192 15
#2006-09-17 20:40:01 GET /robots.txt - - 168.143.106.240 HTTP/1.0 SE03/SE03+(SE+Release;+http://www.SE-Release.org;+SE03@SE-Release.org) - - 200 3286 166 234

# ---------------------------------------------------------------------------
# Crawlers excluded from the entire site ("Disallow: /").
# Several crawlers are listed both with and without a version suffix.
# NOTE(review): presumably this is so that parsers matching on either form
# of the name apply the rule -- confirm before consolidating.
# ---------------------------------------------------------------------------

User-agent: NaverBot-1.0
Disallow: /

User-agent: SygolBot
Disallow: /

User-agent: Speedy
Disallow: /

# Disabled rule (kept for reference): msnbot is currently allowed.
##User-agent: msnbot/1.0
##Disallow: /

User-agent: lwp-trivial/1.38
Disallow: /

User-agent: lwp-trivial
Disallow: /

User-agent: Snapbot/1.0
Disallow: /

User-agent: Snapbot
Disallow: /

User-agent: Seekbot/1.0
Disallow: /

User-agent: Seekbot
Disallow: /

User-agent: psbot/0.1
Disallow: /

User-agent: psbot
Disallow: /

User-agent: Cazoodle/Nutch-0.9-dev
Disallow: /

User-agent: Cazoodle
Disallow: /

# Disabled rules (kept for reference): these crawlers are currently allowed.
#User-agent: Googlebot-Image/1.0
#Disallow: /

#User-agent: Googlebot
#Disallow: /

#User-agent: Yahoo-MMCrawler/3.x
#Disallow: /

User-agent: LinkWalker
Disallow: /

# NOTE(review): this name contains spaces and an e-mail address; parsers
# that match only on a short product token may never apply it -- verify.
User-agent: FAST Enterprise Crawler 6 used by Enel (gdl_app_fi@enel.it)
Disallow: /

User-agent: sproose/0.1
Disallow: /

User-agent: sproose
Disallow: /

User-agent: swish-e
Disallow: /

User-agent: Accoona-AI-Agent/1.1.2
Disallow: /

User-agent: Accoona-AI-Agent
Disallow: /

User-agent: NG/2.0
Disallow: /

User-agent: NG
Disallow: /

User-agent: Nusearch
Disallow: /

User-agent: voyager/1.0
Disallow: /

User-agent: voyager
Disallow: /

# Disabled catch-all record (kept for reference): no path restrictions are
# currently applied to crawlers not named above.
#User-agent: *
#Disallow: /cgi-bin/
#Disallow: /admin/
#Disallow: /privata/