#
# robots.txt for www.torontopubliclibrary.ca
# Updated: 2024-09-15
#

# Default rules for every crawler that is not named in a later group.
#
# "Crawl-delay" is not part of the Robots Exclusion Protocol (RFC 9309) and is
# not supported by all robots, but it requests a 30s delay between page loads.
#
# The delay and the path rules are kept in ONE "User-agent: *" group on
# purpose: some parsers honour only the first group that matches an agent, so
# splitting them into two "*" groups can cause the Disallow rules to be ignored.
User-agent: *
Crawl-delay: 30
Disallow: /branch-computer/
Disallow: /components/
Disallow: /config/
Disallow: /eblast/
Disallow: /it-essentials/
Disallow: /kids-computer-rr/
Disallow: /kids-computer/
Disallow: /kidsstop/
Disallow: /kiosk/
Disallow: /placehold
Disallow: /research-computer/
Disallow: /rss.jsp
Disallow: /search.jsp
Disallow: /share-item-detail.jsp
Disallow: /xml/

# The agents listed below share a single group and are denied the whole site
# (see the "Disallow: /" that closes the group).
# https://github.com/ai-robots-txt/ai.robots.txt/blob/main/robots.txt
User-agent: Amazonbot
User-agent: Applebot
User-agent: Applebot-Extended
User-agent: Bytespider
User-agent: CCBot
User-agent: ChatGPT-User
User-agent: Claude-Web
User-agent: ClaudeBot
User-agent: DOC
User-agent: Diffbot
User-agent: Download Ninja
User-agent: FacebookBot
User-agent: Fetch
User-agent: FriendlyCrawler
User-agent: GPTBot
User-agent: Google-Extended
User-agent: GoogleOther
User-agent: GoogleOther-Image
User-agent: GoogleOther-Video
User-agent: HTTrack
User-agent: ICC-Crawler
User-agent: ImagesiftBot
User-agent: MSIECrawler
User-agent: Mediapartners-Google*
User-agent: Meta-ExternalAgent
User-agent: Meta-ExternalFetcher
User-agent: Microsoft.URL.Control
User-agent: NPBot
User-agent: OAI-SearchBot
User-agent: Offline Explorer
User-agent: PerplexityBot
User-agent: PetalBot
User-agent: Scrapy
User-agent: SiteSnagger
User-agent: Teleport
User-agent: TeleportPro
User-agent: Timpibot
User-agent: UbiCrawler
User-agent: VelenPublicWebCrawler
User-agent: WebCopier
User-agent: WebReaper
User-agent: WebStripper
User-agent: WebZIP
User-agent: Webzio-Extended
User-agent: Xenu
User-agent: YouBot
User-agent: Zao
User-agent: Zealbot
User-agent: ZyBORG
User-agent: anthropic-ai
User-agent: cohere-ai
User-agent: facebookexternalhit
User-agent: grub-client
User-agent: img2dataset
User-agent: larbin
User-agent: libwww
User-agent: linko
User-agent: omgili
User-agent: omgilibot
User-agent: sitecheck.internetseer.com
User-agent: wget
Disallow: /