Robots.txt file comparison

Previous version copy

  1. # Google Search Engine Robot
  2. # ==========================
  3. User-agent: Googlebot
  4. Allow: /?_escaped_fragment_
  5. Allow: /*?lang=
  6. Allow: /hashtag/*?src=
  7. Allow: /search?q=%23
  8. Allow: /i/api/
  9. Disallow: /search/realtime
  10. Disallow: /search/users
  11. Disallow: /search/*/grid
  12. Allow: /*?ref_src=
  13. Allow: /*?src=
  14. Disallow: /*?
  15. Disallow: /*/followers
  16. Disallow: /*/following
  17. Disallow: /account/deactivated
  18. Disallow: /settings/deactivated
  19. # Yahoo! Search Engine Robot
  20. # ==========================
  21. User-Agent: Slurp
  22. Allow: /?_escaped_fragment_
  23. Allow: /*?lang=
  24. Allow: /hashtag/*?src=
  25. Allow: /search?q=%23
  26. Allow: /i/api/
  27. Disallow: /search/realtime
  28. Disallow: /search/users
  29. Disallow: /search/*/grid
  30. Disallow: /*?
  31. Disallow: /*/followers
  32. Disallow: /*/following
  33. Disallow: /account/deactivated
  34. Disallow: /settings/deactivated
  35. # Yandex Search Engine Robot
  36. # ==========================
  37. User-agent: Yandex
  38. Allow: /?_escaped_fragment_
  39. Allow: /*?lang=
  40. Allow: /hashtag/*?src=
  41. Allow: /search?q=%23
  42. Allow: /i/api/
  43. Disallow: /search/realtime
  44. Disallow: /search/users
  45. Disallow: /search/*/grid
  46. Disallow: /*?
  47. Disallow: /*/followers
  48. Disallow: /*/following
  49. Disallow: /account/deactivated
  50. Disallow: /settings/deactivated
  51. # Microsoft Search Engine Robot
  52. # =============================
  53. User-Agent: msnbot
  54. Allow: /?_escaped_fragment_
  55. Allow: /*?lang=
  56. Allow: /hashtag/*?src=
  57. Allow: /search?q=%23
  58. Disallow: /search/realtime
  59. Disallow: /search/users
  60. Disallow: /search/*/grid
  61. Disallow: /*?
  62. Disallow: /*/followers
  63. Disallow: /*/following
  64. Disallow: /account/deactivated
  65. Disallow: /settings/deactivated
  66. # Bing Search Engine Robot
  67. # ========================
  68. User-Agent: bingbot
  69. Allow: /?_escaped_fragment_
  70. Allow: /*?lang=
  71. Allow: /hashtag/*?src=
  72. Allow: /search?q=%23
  73. Disallow: /search/realtime
  74. Disallow: /search/users
  75. Disallow: /search/*/grid
  76. Disallow: /*?
  77. Disallow: /*/followers
  78. Disallow: /*/following
  79. Disallow: /account/deactivated
  80. Disallow: /settings/deactivated
  81. # Every bot that might possibly read and respect this file
  82. # ========================================================
  83. User-agent: *
  84. Allow: /*?lang=
  85. Allow: /hashtag/*?src=
  86. Allow: /search?q=%23
  87. Allow: /i/api/
  88. Disallow: /search/realtime
  89. Disallow: /search/users
  90. Disallow: /search/*/grid
  91. Disallow: /*?
  92. Disallow: /*/followers
  93. Disallow: /*/following
  94. Disallow: /account/deactivated
  95. Disallow: /settings/deactivated
  96. Disallow: /oauth
  97. Disallow: /1/oauth
  98. Disallow: /i/streams
  99. Disallow: /i/hello
  100. # WHAT-4882 - Block indexing of links in notification emails. This applies to all bots.
  101. # =====================================================================================
  102. Disallow: /i/u
  103. Noindex: /i/u
  104. # Wait 1 second between successive requests. See ONBOARD-2698 for details.
  105. Crawl-delay: 1
  106. # Independent of user agent. Links in the sitemap are full URLs using https:// and need to match
  107. # the protocol of the sitemap.
  108. Sitemap: https://twitter.com/sitemap.xml

New version copy

  1. # Google Search Engine Robot
  2. # ==========================
  3. User-agent: Googlebot
  4. Allow: /?_escaped_fragment_
  5. Allow: /*?lang=
  6. Allow: /hashtag/*?src=
  7. Allow: /search?q=%23
  8. Allow: /i/api/
  9. Disallow: /search/realtime
  10. Disallow: /search/users
  11. Disallow: /search/*/grid
  12. Allow: /*?ref_src=
  13. Allow: /*?src=
  14. Disallow: /*?
  15. Disallow: /*/followers
  16. Disallow: /*/following
  17. Disallow: /account/deactivated
  18. Disallow: /settings/deactivated
  19. # Every bot that might possibly read and respect this file
  20. # ========================================================
  21. User-agent: *
  22. Disallow: /
  23. # WHAT-4882 - Block indexing of links in notification emails. This applies to all bots.
  24. # =====================================================================================
  25. Disallow: /i/u
  26. Noindex: /i/u
  27. # Wait 1 second between successive requests. See ONBOARD-2698 for details.
  28. Crawl-delay: 1
  29. # Independent of user agent. Links in the sitemap are full URLs using https:// and need to match
  30. # the protocol of the sitemap.
  31. Sitemap: https://twitter.com/sitemap.xml