# robots.txt for https://www.researchandmarkets.com/
#
# Use the robots.txt file on the live site,
# as updates are more recent there.
#
# Format note: every directive must sit on its own line. A '#' starts a
# comment that runs to the end of the line, so collapsing this file onto a
# single line turns all of the rules below into one comment.

Sitemap: https://www.researchandmarkets.com/sitemap.xml

# For googlebot, use Google Webmaster Tools.

# msnbot: block URLs whose path ends in ".PDF".
# NOTE(review): a crawler that matches a named group follows only that group,
# so msnbot is not bound by the "User-agent: *" rules below -- confirm this is
# intended.
# NOTE(review): path matching is case-sensitive, so this pattern does not
# cover lowercase ".pdf" URLs -- confirm this is intended.
User-agent: msnbot
Disallow: /*.PDF$

# Default rules for every crawler that has no dedicated group in this file.
User-agent: *
# Basket, sample, order and internal endpoints.
Disallow: /basket_add.asp
Disallow: /samples
Disallow: /feats/download_sample.asp
Disallow: /feats/thank_order.asp
Disallow: /SystemStatus/GetMailCampaignSystemStatus
Disallow: /Common/LogHttpRequest
Disallow: /Common/GetRecentlyViewedProducts
Disallow: /download-attachment
Disallow: /download-order-form
Disallow: /common/add-acl-entry
# Any URL whose query string contains one of these parameters.
Disallow: /*?*filtered=
Disallow: /*?*PageSize=
Disallow: /*?*OrderingOption=
Disallow: /*?*PriceRange=
Disallow: /*?*PublicationDateRange=
Disallow: /*?*CategoryIds=
Disallow: /*?*RegionIds=
Disallow: /*?*CountryIds=
Disallow: /*?*ProducttypeIds=
Disallow: /*?*ExpandedCategoryIds=

# Bad crawlers: each of the following is disallowed from the entire site.
User-agent: Sindup
Disallow: /

User-agent: ezooms.bot
Disallow: /

User-agent: 008
Disallow: /

User-agent: AhrefsBot
Disallow: /

User-agent: ExaleadCloudView
Disallow: /

User-agent: exabot
Disallow: /

User-agent: Arquivo-web-crawler
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: dotbot
Disallow: /

User-agent: JobBot
Disallow: /