# robots.txt -- crawler access policy for this site.
#
# Format reminders:
#   * One directive per line; everything after "#" on a line is a comment.
#   * A crawler obeys ONLY the most specific "User-agent" group that
#     matches it. Googlebot therefore follows the "User-agent: Googlebot"
#     group below and ignores the "User-agent: *" group entirely, so any
#     rule Googlebot must honor has to be repeated in its own group.
#   * No blank lines are used inside a group, because some older parsers
#     treat a blank line as the end of the group.

# ///////////////////////////////////////
# Default rules for every crawler that has no dedicated group below
User-agent: *
Disallow: /_mm/
Disallow: /_notes/
Disallow: /_baks/
Disallow: /_cgi-bin-shortcut/
Disallow: /_docs-shortcut/
Disallow: /MMWIP/
Disallow: /jeremy_hicks/
Disallow: /randy_wood/
Disallow: /wp/randy_wood/
#
# "members" is a secure site and we don't want
# spiders in there
Disallow: /members/
#
# "ntmfm" is a secure site and we don't want
# spiders in there
Disallow: /ntmfm/
#
# "mobile" is basically a text-only version of
# pages that are already indexed in the main site
Disallow: /mobile/
#
# On the main site, links to missionary give
# pages use the mod_rewrite format of
# www.ntm.org/give/123 ... which translates to
# www.ntm.org/give/give_missionary_details.php?missionary_id=123
# ... so since we already have the shortened
# version on the main site, any other reference
# to give_missionary_details.php is in other
# parts of the site, like Explore sites, where
# again we don't want duplicate content indexed
Disallow: /give/give_missionary_details.php
#
# On the main site, links to news details pages
# use the mod_rewrite format of www.ntm.org/news/123
# ... which translates to
# www.ntm.org/news/news_details.php?news_id=123
# ... so since we already have the shortened
# version on the main site, any other reference
# to news_details.php is in other parts of the
# site, like Explore sites, where again we don't
# want duplicate content indexed
Disallow: /news/news_details.php
#
# Don't allow bots to click on a "share" link from any of the news articles.
# This rule is listed in this group as well as in the Googlebot group so
# that it applies to every crawler, not only to Googlebot.
Disallow: /quicklinks/share.php

# ///////////////////////////////////////
# This section is specific to Google spiders
# ... reasons for most rules can be seen above
#
# NOTE(review): the Dreamweaver/working directories (/_mm/, /_notes/,
# /_baks/, /_cgi-bin-shortcut/, /_docs-shortcut/, /MMWIP/) and the
# personal directories (/jeremy_hicks/, /randy_wood/, /wp/randy_wood/)
# are NOT repeated here, so Googlebot is currently allowed to crawl
# them. Confirm whether that is intended.
User-agent: Googlebot
#
# Path patterns must begin with "/"; "/*.csi" blocks every URL whose
# path contains ".csi".
Disallow: /*.csi
Disallow: /members/
Disallow: /ntmfm/
Disallow: /mobile/
#
# "/*_*/ntm*" uses wildcards (specific to
# Google spiders) to match any myMinistry
# site's pages that display main NTM.org
# news articles within the myMinistry site
# ... and we need to cut back on pages
# that have duplicate content as much as
# possible, to help our ranking.
#
# Disallow: /*_*/ntm*
#
# The above rule was commented out by Andy Corley on 4-25-08
# because we are not able to match up this restriction
# with our sitemap that Google uses ... and since they
# don't match up, we keep getting Google "warnings" in
# our www.google.com/webmasters control panel.
Disallow: /give/give_missionary_details.php
Disallow: /news/news_details.php
Disallow: /give/1318
Disallow: /give/1321
Disallow: /give/1323
Disallow: /give/1583
Disallow: /give/2098
Disallow: /give/2363
Disallow: /give/2805
Disallow: /give/5309
#
# Don't allow bots to click on a "share" link from any of the news articles
Disallow: /quicklinks/share.php