#****************************************************************************
# robots.txt
#   : Robots, spiders, and search engines use this file to determine which
#     content they should *not* crawl while indexing your website.
#   : This system is called "The Robots Exclusion Standard."
#   : It is strongly encouraged to use a robots.txt validator to check
#     for valid syntax before any robots read it!
#
# Examples:
#
# Instruct all robots to stay out of the admin area.
#   : User-agent: *
#   : Disallow: /admin/
#
# Restrict Google and MSN from indexing your images.
#   : User-agent: Googlebot
#   : Disallow: /images/
#   : User-agent: MSNBot
#   : Disallow: /images/
#
# NOTE: Every directive must sit on its own line. A "#" starts a comment
#       that runs to the end of the line, so directives placed after a "#"
#       on the same line are ignored by crawlers.
#****************************************************************************

# Location of the sitemap index. This directive is independent of any
# User-agent group.
Sitemap: https://www.markupandprofit.com/sitemap_index.xml

# Rules for all crawlers that do not match a more specific group below.
# All "*" rules are kept in a single group so that parsers which honour
# only the first matching group still see every rule.
User-agent: *
Disallow: /cgi-bin
Disallow: /wp-login.php
Disallow: /xmlrpc.php
Disallow: /cdn-cgi/
# Document/archive downloads: "*" matches any sequence of characters and
# "$" anchors the match to the end of the URL path.
Disallow: /*.doc$
Disallow: /*.pdf$
Disallow: /*.zip$

# Block the ChatGPT-User agent from the entire site.
User-agent: ChatGPT-User
Disallow: /

# Block the CCBot agent from the entire site.
User-agent: CCBot
Disallow: /