# Sitemap index locations. Sitemap directives are independent of any
# User-agent group; each one must sit on its own line to be recognised.
Sitemap: http://www.goabroad.com/sitemap_index.xml
Sitemap: http://www.goabroad.com/study-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/study-abroad/country-city-degprog-sitemap_index.xml
Sitemap: http://www.goabroad.com/study-abroad/country-city-degprog-term-sitemap_index.xml
Sitemap: http://www.goabroad.com/study-abroad/country-degprog-term-sitemap_index.xml
Sitemap: http://www.goabroad.com/volunteer-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/volunteer-abroad/country-city-type-duration-sitemap_index.xml
Sitemap: http://www.goabroad.com/volunteer-abroad/country-city-type-sitemap_index.xml
Sitemap: http://www.goabroad.com/volunteer-abroad/country-type-duration-sitemap_index.xml
Sitemap: http://www.goabroad.com/intern-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/intern-abroad/country-city-type-sitemap_index.xml
Sitemap: http://www.goabroad.com/teach-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/tefl-courses/sitemap_index.xml
Sitemap: http://www.goabroad.com/degree-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/degree-abroad/country-city-degprog-studytype-sitemap_index.xml
Sitemap: http://www.goabroad.com/highschool-study-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/language-study-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/adventure-travel-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/scholarships-abroad/sitemap_index.xml
Sitemap: http://www.goabroad.com/scholarships-abroad/country-acaddegree-degprog-sitemap_index.xml
Sitemap: http://www.goabroad.com/scholarships-abroad/country-degprog-sitemap_index.xml
Sitemap: http://www.goabroad.com/scholarships-abroad/country-type-acaddegree-degprog-sitemap_index.xml
Sitemap: http://www.goabroad.com/scholarships-abroad/country-type-degprog-sitemap_index.xml

# Some bots are known to be trouble, particularly those designed to copy
# entire sites. Please obey robots.txt.
# Crawlers denied access to the whole site. One group per agent, one
# directive per line, so every parser sees each Disallow rule.
User-agent: spider
Disallow: /

User-agent: bot-
Disallow: /

User-agent: bot/
Disallow: /

User-agent: LinkChecker
Disallow: /

User-agent: Microsoft URL Control
Disallow: /

User-agent: IRLbot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: Java
Disallow: /

User-agent: nicebot
Disallow: /

User-agent: Nutch
Disallow: /

User-agent: Python-urllib
Disallow: /

User-agent: Powermarks
Disallow: /

User-agent: Missigua_Locator
Disallow: /

User-agent: Web Downloader
Disallow: /

User-agent: lanshanbot
Disallow: /

User-agent: Custo
Disallow: /

User-agent: CFNetwork
Disallow: /

User-agent: HTTrack off-line browser
Disallow: /

User-agent: NutchCVS
Disallow: /

User-agent: T-H-U-N-D-E-R-S-T-O-N-E
Disallow: /

User-agent: Jakarta commons-httpclient
Disallow: /

User-agent: HTMLParser
Disallow: /

User-agent: crawl
Disallow: /

User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: Zealbot
Disallow: /

User-agent: MSIECrawler
Disallow: /

User-agent: SiteSnagger
Disallow: /

User-agent: WebStripper
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: Fetch
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: Teleport
Disallow: /

User-agent: TeleportPro
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: linko
Disallow: /

User-agent: HTTrack
Disallow: /

User-agent: Microsoft.URL.Control
Disallow: /

User-agent: larbin
Disallow: /

User-agent: ZyBORG
Disallow: /

User-agent: Download Ninja
Disallow: /

#
# Doesn't follow robots.txt anyway, but...
#
User-agent: k2spider
Disallow: /

# A capture bot, downloads gazillions of pages with no public benefit
# http://www.webreaper.net/
User-agent: WebReaper
Disallow: /

#
# Hits many times per second, not acceptable
# http://www.nameprotect.com/botinfo.html
User-agent: NPBot
Disallow: /

# Rules for every crawler not matched by a group above: /index.php is
# explicitly allowed; the listed paths are excluded from crawling.
User-agent: *
Allow: /index.php
Disallow: /frontend_dev.php/
Disallow: /admin_dev.php/
Disallow: /client_dev.php/
Disallow: /help
Disallow: /stats