Page Content
# robots.txt for www.nwa.com
#
# Outside agents may search the site, but will be restricted from the
# disallowed directories.
#
# Format note: robots.txt is line-oriented. Each directive must be on its own
# line, and a "#" starts a comment that runs to the end of the line.

Sitemap: http://www.nwa.com/sitemap.xml

# Default group: applies to every crawler that has no more specific group below.
User-agent: *
Disallow: /aaq
Disallow: /kanaiq
Disallow: /club
Disallow: /cgi-bin
Disallow: /cgi-bin2
Disallow: /tmp
Disallow: /logs
Disallow: /philly
Disallow: /images
Disallow: /nwco
Disallow: /palm
Disallow: /cargo
Disallow: /pe002
Disallow: /pe003
Disallow: /pe004
Disallow: /pe005
Disallow: /pe006
Disallow: /pe007
Disallow: /corpinfo/newsc
Disallow: /weather

# Primary search engine will have same area as outside engines, as well as
# feature press releases. Only the dated press release archives (1997-2002)
# are excluded; the rest of /corpinfo/newsc is open to this crawler.
# NOTE(review): unlike the "*" group, this group does not disallow /aaq,
# /kanaiq, /club or /weather -- confirm whether that difference is intended.
User-agent: htdig-main
Disallow: /cgi-bin
Disallow: /cgi-bin2
Disallow: /tmp
Disallow: /logs
Disallow: /philly
Disallow: /images
Disallow: /nwco
Disallow: /palm
Disallow: /cargo
Disallow: /pe002
Disallow: /pe003
Disallow: /pe004
Disallow: /pe005
Disallow: /pe006
Disallow: /pe007
Disallow: /corpinfo/newsc/2002
Disallow: /corpinfo/newsc/2001
Disallow: /corpinfo/newsc/2000
Disallow: /corpinfo/newsc/1999
Disallow: /corpinfo/newsc/1998
Disallow: /corpinfo/newsc/1997

# Press release search engine will restrict itself to press release area, but
# has free rein there (no /corpinfo/newsc rule in this group).
# NOTE(review): the rules below only exclude directories; nothing here confines
# the crawler to the press release area -- presumably that is done in the
# crawler's own configuration; confirm.
User-agent: htdig-press
Disallow: /cgi-bin
Disallow: /cgi-bin2
Disallow: /tmp
Disallow: /logs
Disallow: /philly
Disallow: /images
Disallow: /nwco
Disallow: /palm
Disallow: /cargo
Disallow: /pe002
Disallow: /pe003
Disallow: /pe004
Disallow: /pe005
Disallow: /pe006
Disallow: /pe007
Disallow: /weather