# robots.txt automatically generated for JOUTECH.MA
#
# This file is to prevent the crawling and indexing of your site
# by web crawlers and spiders run by sites like Bing
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# For more information about the robots.txt standard, see:
# https://www.robotstxt.org/robotstxt.html
#
# Format reminder: robots.txt is line-oriented. Every directive must sit on
# its own line, and "#" comments out the rest of the line it appears on.

# Global rules (apply to every crawler that has no more specific group below)
User-agent: *

# Allow necessary scripts and styles.
# These are more specific (longer) than the Disallow rules for the same
# directories, so they take precedence for the paths they match.
Allow: /wp-admin/admin-ajax.php
Allow: /wp-includes/js/
Allow: /wp-content/themes/
Allow: /wp-content/uploads/

# Block admin and system files
Disallow: /wp-admin/
Disallow: /wp-includes/
Disallow: /wp-content/plugins/
Disallow: /xmlrpc.php
Disallow: /trackback/
Disallow: /wp-login.php
Disallow: /readme.html
Disallow: /license.txt

# Prevent duplicate content.
# "/*?" matches every URL that contains a query string, so the narrower
# query-string patterns that follow are already covered by it; they are kept
# to document which parameters motivated the rule.
Disallow: /*?
Disallow: /*?order=
Disallow: /*?replytocom=
Disallow: /*?add-to-cart=
Disallow: /product/*?*

# WooCommerce specific exclusions.
# These are longer than "Allow: /wp-content/uploads/" and therefore win for
# these sub-directories.
Disallow: /wp-content/uploads/wc-logs/
Disallow: /wp-content/uploads/woocommerce_transient_files/
Disallow: /wp-content/uploads/woocommerce_uploads/

# Cart, checkout, and account pages
Disallow: /my-account/
Disallow: /cart/
Disallow: /checkout/
Disallow: /thank-you/

# Sitemap (not tied to any User-agent group)
Sitemap: https://joutech.ma/sitemap_index.xml

# Allow AI search and agent use.
# NOTE: a crawler obeys only the most specific group that names it, so the
# bots listed here follow "Allow: /" and are NOT bound by the global rules
# above (admin, cart, checkout, ...). Confirm that this is intended.
User-agent: OAI-SearchBot
User-agent: ChatGPT-User
User-agent: PerplexityBot
User-agent: FirecrawlAgent
User-agent: AndiBot
User-agent: ExaBot
User-agent: PhindBot
User-agent: YouBot
Allow: /

# Disallow AI training data collection.
# NOTE(review): this group only takes effect if it is followed by at least one
# rule line (e.g. a Disallow rule); verify that the rule is present.
User-agent: GPTBot
User-agent: CCBot
User-agent: Google-Extended