# See http://www.robotstxt.org/wc/norobots.html for documentation on how to use the robots.txt file
#
# To ban all spiders from the entire site uncomment the next two lines:
# User-Agent: *
# Disallow: /
#
# Also be aware that this robots.txt is only served for charanga.com and the
# principal partner sites. We have a dynamically generated robots.txt for
# assets1.charanga.com, assets2.charanga.com etc to prevent us getting duplicate
# content penalties, but it might interfere with e.g. redbot.org testing
# ---------------------------------------------------------------------------
# Rules for every crawler that does not match a more specific group below.
#
# All "User-agent: *" rules are kept in this ONE group on purpose: parsers
# that only honour the first "*" group they see (Python's urllib.robotparser,
# for example) would otherwise ignore every rule except the first one.
# Do not put blank lines inside a group; some parsers treat a blank line as
# the end of the group. Blank lines are only used BETWEEN groups.
# ---------------------------------------------------------------------------
User-agent: *
Disallow: /hnyp0t
# Don't index any pdfs in the resource_library; there are brochures elsewhere
# that we do want indexed, hence the /resource_library path.
# (The broader /resource_library rule below already covers these pdfs; this
# line is kept so the intent stays visible if that rule is ever relaxed.)
Disallow: /resource_library/*.pdf$
#Noindex: /resource_library/*.pdf$
# And really, we should just stop any crawling of the resource_library
Disallow: /resource_library
#Noindex: /resource_library
# Google, Yahoo, MSN et al all seem to be trying to index this (non-existent)
# url. No idea why; tell them not to bother.
Disallow: /~magnolia/
# It was public, now it's login-only. We need this here so we can purge
# cached copies with Google Webmaster Tools
Disallow: /music_service_admin/letters/pupil_information_printable
# Stop dumb robots submitting these with no values
Disallow: /school_quotes
#Noindex: /school_quotes
Disallow: /vip_session_accounts
#Noindex: /vip_session_accounts
Disallow: /quotes
#Noindex: /quotes
Disallow: /musicalschoolfreetrial
Disallow: /assets/record_usage
Disallow: /admin
#Noindex: /admin
Disallow: /music_service_admin
#Noindex: /music_service_admin
Disallow: /training_events
#Noindex: /training_events

# ---------------------------------------------------------------------------
# Crawler-specific groups.
# NOTE: a crawler that matches one of these groups follows ONLY that group
# and ignores the "*" rules above (standard robots.txt group selection).
# ---------------------------------------------------------------------------

# redbot is very useful for testing, but will only work if we
# specifically allow it
User-agent: RED
Allow: /

# Stop BingPreview from invalidating links
User-agent: BingPreview
Disallow: /pupil_reports
#Noindex: /pupil_reports

# AdsBot-Google is following links that deliver converting users to us.
# It seems to particularly like the login page, so keep it away from there.
User-agent: AdsBot-Google
Disallow: /user/login

# Some SEO spider that's all over us
User-agent: MJ12bot
Disallow: /

# ---------------------------------------------------------------------------
# Sitemaps.
# These have to be fully qualified URLs, and because this robots.txt is shared
# let's add them all here. They are listed after all groups so that they never
# sit in the middle of a rule group.
# ---------------------------------------------------------------------------
# Ours
Sitemap: https://charanga.com/site/sitemap_index.xml
Sitemap: https://www.charanga.cz/site/sitemap_index.xml
Sitemap: https://www.charanga.dk/site/sitemap_index.xml
Sitemap: https://www.charanga.com.au/site/sitemap_index.xml
Sitemap: https://www.charanga.co.za/site/sitemap_index.xml
Sitemap: https://www.charanga.hk/site/sitemap_index.xml
Sitemap: https://www.charanga.in/site/sitemap_index.xml
Sitemap: https://www.charanga.vn/site/sitemap_index.xml
# Partners
# NOTE(review): the next URL ends in "sitemapindex.xml" while every other
# entry uses "sitemap_index.xml" - confirm this is intentional and not a typo.
Sitemap: https://www.banesmusiconline.co.uk/site/sitemapindex.xml
Sitemap: https://www.bradfordmusiconline.co.uk/site/sitemap_index.xml
Sitemap: https://www.essexmusichub.org.uk/site/sitemap_index.xml
Sitemap: https://www.lancashiremusichub.co.uk/site/sitemap_index.xml
Sitemap: https://www.norfolkmusichub.org.uk/site/sitemap_index.xml
Sitemap: https://www.richmondmusictrust.org.uk/site/sitemap_index.xml
Sitemap: https://www.wakefieldmusicservices.org/site/sitemap_index.xml