# robots.txt - crawler access rules.
#
# Format reminders:
#   * exactly one directive per line; a "#" starts a comment that runs to the
#     end of the line, so a directive must never follow a comment on the same line
#   * no blank lines inside a group (older parsers treat a blank line as the
#     end of the group)
#   * a crawler obeys only the most specific group that matches its name;
#     it does NOT additionally inherit the rules of the "*" group

# ---------------------------------------------------------------------------
# Default rules for every crawler without a dedicated group below
# ---------------------------------------------------------------------------
User-Agent: *
# short url redirects
Disallow: /c/
Disallow: /g/
Disallow: /L/
Disallow: /n/
Disallow: /p/
Disallow: /r/
Disallow: /t/
Disallow: /u/
Disallow: /w/
Disallow: /y/
Disallow: /a/
Disallow: /b/
Disallow: /d/
Disallow: /e/
Disallow: /f/
Disallow: /h/
Disallow: /i/
Disallow: /j/
Disallow: /k/
Disallow: /m/
Disallow: /q/
Disallow: /v/
Disallow: /x/
Disallow: /z/
Disallow: /tw/
Disallow: /sw/
Disallow: /pt/
Disallow: /pi/
Disallow: /lk/
Disallow: /cm/
Disallow: /fr/
Disallow: /po/
Disallow: /si/
Disallow: /pm/
Disallow: /tc/
Disallow: /tm/
Disallow: /we/
Disallow: /ei/
Disallow: /og/
Disallow: /ct/
Disallow: /cw/
Disallow: /likes?data_target
Disallow: /tracked_workouts/*
Disallow: /sounds/
Disallow: /digital_sounds/
Disallow: /leaderboard.mobile
Disallow: /native_android/*
Disallow: /native-android/*
# exclude list and activity pages with no important info on them
Disallow: /tracked_activities
Disallow: /yoga_ticks/*
Disallow: /weight_ticks/*
Disallow: /pilates_ticks/*
Disallow: /cardio_ticks/*
Disallow: /poses_ticks/*
Disallow: /team_sport_ticks/*
Disallow: /program_instances/*
Disallow: /trips/*
# Not public version
Disallow: /workout_exercises/*
# old urls that are the same as /workouts/ - removed since we have canonical URLs there
# Disallow: /interval_timers/
Disallow: /workouts/liked
# path json data
Disallow: /paths/*/data.json
Allow: /
# Slow down bots (kept inside the group, ahead of the Sitemap record, so that
# every parser attributes it to "User-Agent: *")
Crawl-delay: 2

# Sitemap records are independent of any user-agent group
Sitemap: https://www.skimble.com/sitemap_index.xml.gz

# ---------------------------------------------------------------------------
# try to slow down bots that are known to be aggressive
#
# NOTE(review): because these bots have their own groups, they ignore every
# Disallow rule of the "*" group above. GPTBot is only kept out of /people/
# and bingbot is not kept out of anything. Confirm this is intended; if not,
# the "*" rules have to be repeated in these groups.
# ---------------------------------------------------------------------------
User-Agent: GPTBot
Disallow: /people/
Crawl-delay: 2

User-Agent: bingbot
Crawl-delay: 2

# ---------------------------------------------------------------------------
# block certain bots entirely
#
# NOTE(review): names containing spaces (e.g. "Linguee Bot", "The Knowledge AI",
# "SISTRIX Crawler") are not valid RFC 9309 product tokens and may not be
# matched by strict parsers. They are kept as-is for lenient ones.
# ---------------------------------------------------------------------------
User-Agent: AwarioBot
Disallow: /

User-Agent: ImagesiftBot
Disallow: /

User-Agent: Bytedance
Disallow: /

User-Agent: Bytespider
Disallow: /

User-Agent: MauiBot
Disallow: /

User-Agent: PetalBot
Disallow: /

User-Agent: grapeshot
Disallow: /

User-Agent: Baiduspider
Disallow: /

User-Agent: MegaIndex
Disallow: /

User-Agent: AhrefsBot
Disallow: /

User-Agent: Treato-Bot
Disallow: /

User-Agent: SemrushBot
Disallow: /

User-Agent: SeekportBot
Disallow: /

User-Agent: Barkrowler
Disallow: /

User-Agent: Linguee Bot
Disallow: /

User-Agent: The Knowledge AI
Disallow: /

# Sistrix (lower-case name)
User-Agent: sistrix
Disallow: /

# Sistrix (crawler name variant)
User-Agent: SISTRIX Crawler
Disallow: /

# Sistrix (upper-case name)
User-Agent: SISTRIX
Disallow: /

# SEOkicks-Robot
User-Agent: SEOkicks-Robot
Disallow: /

# jobs.de-Robot
User-Agent: jobs.de-Robot
Disallow: /

# Bot of Unister Holding GmbH, Leipzig
User-Agent: UnisterBot
Disallow: /

# http://www.opensiteexplorer.org/dotbot
User-Agent: DotBot
Disallow: /

User-Agent: dotbot
Disallow: /

# http://www.searchmetrics.com
User-Agent: SearchmetricsBot
Disallow: /

# http://www.majestic12.co.uk/projects/dsearch/mj12bot.php
User-Agent: MJ12bot
Disallow: /

# http://www.domaintools.com/webmasters/surveybot.php
User-Agent: SurveyBot
Disallow: /

# http://www.seodiver.com/bot
User-Agent: SEOdiver
Disallow: /

# http://openlinkprofiler.org/bot
User-Agent: spbot
Disallow: /

# http://www.wotbox.com/bot/
User-Agent: wotbox
Disallow: /

# http://www.meanpath.com/meanpathbot.html
User-Agent: meanpathbot
Disallow: /

# http://www.backlinktest.com/crawler.html
User-Agent: BacklinkCrawler
Disallow: /

# http://www.brandwatch.com/magpie-crawler/
User-Agent: magpie-crawler
Disallow: /

# http://filterdb.iss.net/crawler/
User-Agent: oBot
Disallow: /

User-Agent: fr-crawler
Disallow: /

# http://webmeup-crawler.com
User-Agent: BLEXBot
Disallow: /

# https://megaindex.com/crawler
User-Agent: MegaIndex.ru
Disallow: /

User-Agent: megaindex.com
Disallow: /

# http://www.cloudservermarket.com
User-Agent: CloudServerMarketSpider
Disallow: /

# http://www.trendiction.de/de/publisher/bot
User-Agent: trendictionbot
Disallow: /

# http://www.exalead.com
User-Agent: Exabot
Disallow: /

# http://www.career-x.de/bot.html
User-Agent: careerbot
Disallow: /

# https://www.lipperhey.com/en/about/
User-Agent: Lipperhey-Kaus-Australis
Disallow: /
# ---------------------------------------------------------------------------
# Bots that are blocked from the whole site.
#
# One directive per line: a "#" comment runs to the end of its line, so a
# User-Agent/Disallow record must never share a line with a preceding comment.
#
# NOTE(review): names containing spaces or "/" (e.g. "Domain Re-Animator Bot",
# "Screaming Frog SEO Spider", "Python/3.5 aiohttp") are not valid RFC 9309
# product tokens and may not be matched by strict parsers. They are kept
# as-is for lenient ones.
# ---------------------------------------------------------------------------
User-Agent: seoscanners.net
Disallow: /

User-Agent: MetaJobBot
Disallow: /

User-Agent: Spiderbot
Disallow: /

User-Agent: LinkStats
Disallow: /

User-Agent: JobboerseBot
Disallow: /

User-Agent: ICCrawler
Disallow: /

User-Agent: Plista
Disallow: /

User-Agent: Domain Re-Animator Bot
Disallow: /

# https://www.lipperhey.com/en/about/
User-Agent: Lipperhey-Kaus-Australis
Disallow: /

# https://turnitin.com/robot/crawlerinfo.html
User-Agent: turnitinbot
Disallow: /

# http://help.coccoc.com/
User-Agent: coccoc
Disallow: /

# ubermetrics-technologies.com
User-Agent: um-IC
Disallow: /

# datenbutler.de
User-Agent: mindUpBot
Disallow: /

# http://searchgears.de/uber-uns/crawling-faq.html
User-Agent: sg-Orbiter
Disallow: /

# http://commoncrawl.org/faq/
User-Agent: CCBot
Disallow: /

# https://www.qwant.com/
User-Agent: Qwantify
Disallow: /

# http://linkfluence.net/
User-Agent: Kraken
Disallow: /

# http://www.botje.com/plukkie.htm
User-Agent: plukkie
Disallow: /

# https://www.safedns.com/searchbot
User-Agent: SafeDNSBot
Disallow: /

# http://www.haosou.com/help/help_3_2.html
User-Agent: 360Spider
Disallow: /

# http://www.haosou.com/help/help_3_2.html
User-Agent: HaosouSpider
Disallow: /

# http://www.moz.com/dp/rogerbot
User-Agent: rogerbot
Disallow: /

# http://www.openhose.org/bot.html
User-Agent: OpenHoseBot
Disallow: /

# http://www.screamingfrog.co.uk/seo-spider/
User-Agent: Screaming Frog SEO Spider
Disallow: /

# http://thumbsniper.com
User-Agent: ThumbSniper
Disallow: /

# http://www.radian6.com/crawler
User-Agent: R6_CommentReader
Disallow: /

User-Agent: ImplisenseBot
Disallow: /

# http://cliqz.com/company/cliqzbot
User-Agent: Cliqzbot
Disallow: /

# https://www.aihitdata.com/about
User-Agent: aiHitBot
Disallow: /

# http://www.trendiction.com/en/publisher/bot
User-Agent: trendictionbot
Disallow: /

# http://seocompany.store
User-Agent: adscanner
Disallow: /

# https://github.com/yasserg/crawler4j/
User-Agent: crawler4j
Disallow: /

# http://warebay.com/bot.html
User-Agent: WBSearchBot
Disallow: /

User-Agent: Python/3.5 aiohttp
Disallow: /

User-Agent: Toweya.com
Disallow: /

# http://www.website-datenbank.de/
User-Agent: netEstate
Disallow: /

# http://law.di.unimi.it/BUbiNG.html
User-Agent: BUbiNG
Disallow: /

# http://www.linguee.com/bot; bot@linguee.com
User-Agent: Linguee
Disallow: /

User-Agent: SemrushBot-SA
Disallow: /

# www.sentibot.eu
User-Agent: sentibot
Disallow: /

User-Agent: SentiBot
Disallow: /

# http://velen.io
User-Agent: VelenPublicWebCrawler
Disallow: /

User-Agent: DomainCrawler
Disallow: /

# https://moz.com/help/guides/moz-procedures/what-is-rogerbot
# (second rogerbot entry; groups for the same user-agent are combined)
User-Agent: rogerbot
Disallow: /

User-Agent: IndeedBot
Disallow: /

# http://www.garlik.com
User-Agent: GarlikCrawler
Disallow: /

# https://www.gosign.de/typo3-extension/typo3-sicherheitsmonitor/
User-Agent: Gosign-Security-Crawler
Disallow: /

# http://www.siteliner.com/bot
User-Agent: Siteliner
Disallow: /

# https://sabsim.com
User-Agent: SabsimBot
Disallow: /

# http://ltx71.com/
User-Agent: ltx71
Disallow: /

User-Agent: DataForSeoBot
Disallow: /

User-Agent: SenutoBot
Disallow: /

User-Agent: NeevaBot
Disallow: /