# Crawler access rules (Robots Exclusion Protocol).
#
# Layout of this file:
#   1. Sitemap location (independent of any user-agent group).
#   2. Default rules for every crawler that has no group of its own ("*").
#   3. Rules for the major search engines: the default rules plus
#      /sites/campus-news.
#   4. Crawlers that are blocked from the whole site.
#
# Inside a group, use "#" comment lines instead of blank lines; some parsers
# treat a blank line as the end of the group.

# SiteMap.xml can be found at this URL
Sitemap: http://www.utsouthwestern.edu/sitemap.xml

User-agent: *
# Googlebot seeing 500 errors for Patient Care global site search
Disallow: /patientcare/globalsearch/
# Spammers are linking to hrmsphoto.jsp
Disallow: /utsw-ext-templating/org/jsp/
Disallow: /wp-login.php
Disallow: /connectors/system/settings.php
Disallow: /EWS/Exchange.asmx
Disallow: /wp-admin
Disallow: /wp-includes
Disallow: /wp-content
# Googlebot seeing badly-formed URLs from some HR pages
Disallow: /UTSW/CMA/CMA_applications/UTSWPageStencils/human_resource/
# Do not allow crawl of the following web page
Disallow: /about-us/administrative-offices/information-resources/academic-information-systems/systems/core-lims.html
Disallow: /_googlesearch
Disallow: /_googlesearch?q=&site=
Disallow: /_channelcache
Disallow: /_collectioncache
Disallow: /_assetcache
Disallow: /_websitepagecache
Disallow: /shared/
# Do not allow jsonp calls from this application
Disallow: /nfis/getGraduateSchoolProgramsByProgramNameFilter.jsonp
Disallow: /nfis/getClinicalKeywordsByKeywordNameFilter.jsonp
Disallow: /nfis/getDepartmentsByDepartmentNameFilter.jsonp
Disallow: /nfis/getProfileFacultiesByNameFilter.jsonp
# Do not crawl the St. Paul demolition page and map
Disallow: /newsroom/media-relations/st-paul-demolition.html
Disallow: /edumedia/edufiles/newsroom/demolition-map.pdf
# Do not crawl purchasing documents
Disallow: /edumedia/edufiles/about_us/admin_offices/Purchasing/
# Do not crawl any of the sugar content
Disallow: /sugar
Disallow: /legal/open-records-request.html
# Do not crawl email pages
Disallow: /sites/cuh-email
Disallow: /sites/html-email
# Do not crawl the new Campus Updates site or any of its pages
Disallow: /sites/campus-updates
# Do not crawl open record requests
Disallow: /open-records-request-detail.html?requestId=
Disallow: /openrecordsdoc/
# Do not crawl purchasing transparency
Disallow: /about-us/administrative-offices/purchasing/transparency.html
# Do not allow individual news items in search
Disallow: /newsroom/in-the-news/year
# Do not crawl test folder
Disallow: /test
Disallow: /edu-guide
Disallow: /resources
#Disallow: /fonts
#Disallow: /css
#Disallow: /js
#Disallow: /img
# Do not allow campaign landing pages
Disallow: /lp/
Disallow: /alerts/
# Do not allow crawl of in-pursuit (currently disabled)
###Disallow: /research/in-pursuit/

# Major search engines.
#
# A crawler that finds a group naming it obeys ONLY that group and ignores the
# "*" group above (RFC 9309, "The User-Agent Line"). Every default rule is
# therefore repeated here; without the copy these crawlers would be blocked
# from /sites/campus-news and nothing else.
#
# KEEP IN SYNC: any Disallow added to or removed from the "*" group must be
# mirrored in this group.
User-agent: Googlebot
User-agent: Bingbot
User-agent: Slurp
User-agent: DuckDuckBot
User-agent: Baiduspider
User-agent: YandexBot
# Do not crawl /sites/campus-news (added on 09/05/2018)
Disallow: /sites/campus-news
# --- copy of the "*" rules starts here ---
Disallow: /patientcare/globalsearch/
Disallow: /utsw-ext-templating/org/jsp/
Disallow: /wp-login.php
Disallow: /connectors/system/settings.php
Disallow: /EWS/Exchange.asmx
Disallow: /wp-admin
Disallow: /wp-includes
Disallow: /wp-content
Disallow: /UTSW/CMA/CMA_applications/UTSWPageStencils/human_resource/
Disallow: /about-us/administrative-offices/information-resources/academic-information-systems/systems/core-lims.html
Disallow: /_googlesearch
Disallow: /_googlesearch?q=&site=
Disallow: /_channelcache
Disallow: /_collectioncache
Disallow: /_assetcache
Disallow: /_websitepagecache
Disallow: /shared/
Disallow: /nfis/getGraduateSchoolProgramsByProgramNameFilter.jsonp
Disallow: /nfis/getClinicalKeywordsByKeywordNameFilter.jsonp
Disallow: /nfis/getDepartmentsByDepartmentNameFilter.jsonp
Disallow: /nfis/getProfileFacultiesByNameFilter.jsonp
Disallow: /newsroom/media-relations/st-paul-demolition.html
Disallow: /edumedia/edufiles/newsroom/demolition-map.pdf
Disallow: /edumedia/edufiles/about_us/admin_offices/Purchasing/
Disallow: /sugar
Disallow: /legal/open-records-request.html
Disallow: /sites/cuh-email
Disallow: /sites/html-email
Disallow: /sites/campus-updates
Disallow: /open-records-request-detail.html?requestId=
Disallow: /openrecordsdoc/
Disallow: /about-us/administrative-offices/purchasing/transparency.html
Disallow: /newsroom/in-the-news/year
Disallow: /test
Disallow: /edu-guide
Disallow: /resources
Disallow: /lp/
Disallow: /alerts/
# --- copy of the "*" rules ends here ---

# Crawlers blocked from the entire site.
# The first Vegi bot entry reproduces the long user-agent string that crawler
# sends; the second is the short form of the same name.
User-agent: Vegi bot (we follow your robots.txt settings before crawling, you can slow down the bot by change the Crawl-Delay parameter in the settings.if you have an enquiry, please email to: abuse-report@terrykyleseoagency.com)
Disallow: /

User-agent: Vegi bot
Disallow: /

User-agent: libwww
Disallow: /

User-agent: HTTP::Lite
Disallow: /

User-agent: PHPCrawl
Disallow: /

User-agent: WEP Search
Disallow: /

User-agent: EmailCollector
Disallow: /

User-agent: EmailSiphon
Disallow: /

User-agent: EmailWolf
Disallow: /