PageRenderTime 60ms CodeModel.GetById 23ms RepoModel.GetById 0ms app.codeStats 0ms

/alert/assets/templates/robots/robots.txt

https://bitbucket.org/jbward/search-and-awareness-platform-courtlistener
Plain Text | 62 lines | 54 code | 8 blank | 0 comment | 0 complexity | 0f7d9b6c703ca745cb095056f088efd2 MD5 | raw file
Possible License(s): LGPL-2.0, AGPL-3.0, BSD-3-Clause, MPL-2.0-no-copyleft-exception
  1. # Google, AOL, Bing, Yahoo!
  2. # These support meta robots and x-robots-tag.
  3. # Crawl everything except a few explicit blocks
  4. User-agent: Googlebot
  5. Disallow: /robots.txt
  6. Disallow: /dumps/
  7. Disallow: /assets/
  8. Disallow: /api/rest/v1/
  9. User-agent: bingbot
  10. Disallow: /robots.txt
  11. Disallow: /dumps/
  12. Disallow: /assets/
  13. Disallow: /api/rest/v1/
  14. User-agent: Slurp
  15. Disallow: /robots.txt
  16. Disallow: /dumps/
  17. Disallow: /assets/
  18. Disallow: /api/rest/v1/
  19. # Yandex (YandexBot), Ask (teoma), Alexa (ia_archiver)
  20. # These support meta robots, but not x-robots-tag
  21. # Crawl everything except real files (/pdf/, /wpd/, /txt/, /doc/), which cannot carry a robots meta tag
  22. User-agent: YandexBot
  23. Disallow: /robots.txt
  24. Disallow: /dumps/
  25. Disallow: /assets/
  26. Disallow: /api/rest/v1/
  27. Disallow: /pdf/
  28. Disallow: /wpd/
  29. Disallow: /txt/
  30. Disallow: /doc/
  31. User-agent: teoma
  32. Disallow: /robots.txt
  33. Disallow: /dumps/
  34. Disallow: /assets/
  35. Disallow: /api/rest/v1/
  36. Disallow: /pdf/
  37. Disallow: /wpd/
  38. Disallow: /txt/
  39. Disallow: /doc/
  40. User-agent: ia_archiver
  41. Disallow: /robots.txt
  42. Disallow: /dumps/
  43. Disallow: /assets/
  44. Disallow: /api/rest/v1/
  45. Disallow: /pdf/
  46. Disallow: /wpd/
  47. Disallow: /txt/
  48. Disallow: /doc/
  49. # Duckduckgo, Baidu, Blekko, Others
  50. # These support neither the robots meta tag nor x-robots-tag.
  51. # Be conservative: block everything.
  52. User-agent: *
  53. Disallow: /
  54. Sitemap: https://www.courtlistener.com/sitemap.xml