newyorksportsclubs.com Review

Title tag | Description tag | Language
Home | NYSC en-us
Alexa rank
399086
IP address: 54.87.33.86
Nameservers:
ns-138.awsdns-17.com
ns-681.awsdns-21.net
ns-1234.awsdns-26.org
ns-1976.awsdns-55.co.uk
Status code: 200
robots.txt - http://newyorksportsclubs.com/robots.txt
 # ==================================================================================
# ✅ Allow major search engine bots, but block URLs containing "confirmation" or "dtx-confirmation"
# Reason: These are typically thank-you or conversion pages that do not need indexing.
# Blocking them improves SEO hygiene and keeps post-submission pages out of search results.
# ==================================================================================

User-agent: Googlebot
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*

User-agent: Bingbot
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*

User-agent: DuckDuckBot
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*

User-agent: Applebot
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*

User-agent: Slurp
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*

# ==================================================================================
# ✅ Allow social media bots to fetch preview content (title, image, description)
# These bots are harmless and helpful for link sharing on platforms like Facebook & Twitter.
# ==================================================================================

User-agent: facebookexternalhit
Allow: /
User-agent: Twitterbot
Allow: /

# ==================================================================================
# ✅ Allow Google to crawl images and news content
# Ensures media content is indexed properly for visibility in Google Image Search and News.
# ==================================================================================

User-agent: Googlebot-Image
Allow: /

User-agent: Googlebot-News
Allow: /

# ==================================================================================
# 🧠 Block modern AI crawlers and data-harvesting bots
# Reason: These bots scrape site content for AI training or data resale without permission.
# Blocking them protects intellectual property and privacy.
# ==================================================================================

User-agent: GPTBot
Disallow: /

User-agent: ChatGPT-User
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: anthropic-ai
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: Amazonbot
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: Pinterestbot
Disallow: /

# ==================================================================================
# ❌ Block aggressive SEO scraping bots (excluding SemrushBot which is allowed)
# These bots often crawl heavily and add no SEO value. Blocking them conserves server resources.
# ==================================================================================

User-agent: AhrefsBot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: Screaming Frog SEO Spider
Disallow: /

User-agent: Sitebulb
Disallow: /

User-agent: DotBot
Disallow: /

User-agent: BLEXBot
Disallow: /

User-agent: SEOkicks
Disallow: /

User-agent: Exabot
Disallow: /

User-agent: Yandex
Disallow: /

User-agent: Baiduspider
Disallow: /

# ==================================================================================
# 🔒 Default rules for any unidentified or generic bots
# Applies the same protections: blocks sensitive paths, query-based duplicates, and private areas.
# ==================================================================================

User-agent: *
Disallow: /*dtx-confirmation*
Disallow: /*confirmation*
Disallow: /*?                  # Avoid crawling URLs with query strings (often duplicates)
Disallow: /*#                  # Avoid URLs with hash fragments
Disallow: /*thank              # Prevent thank-you pages from indexing
Disallow: /tmp/                # Block temporary file directory
Disallow: /cache/              # Block cached file directory
Disallow: /admin/              # Block admin panel
Disallow: /career              # Block career-related paths
Disallow: /wp-login.php        # Block WordPress login page
Disallow: /wp-register.php     # Block WordPress register page
Disallow: /clubs/downtown-crossing

# ==================================================================================
# πŸ—ΊοΈ Sitemap declaration
# Helps search engines understand your site structure and prioritize crawling efficiently.
# ==================================================================================

Sitemap: https://www.newyorksportsclubs.com/sitemap_index.xml
HTTP/1.1 301 Moved Permanently
Date: Thu, 28 Aug 2025 14:56:46 GMT
Content-Type: text/html; charset=UTF-8
Transfer-Encoding: chunked
Connection: keep-alive
Server: nginx
Set-Cookie: PHPSESSID=jd72rr3m7nt0ssdlrrjokfudif; path=/
Pragma: no-cache
Expires: Wed, 11 Jan 1984 05:00:00 GMT
Cache-Control: no-cache, must-revalidate, max-age=0
X-Redirect-By: WordPress
Location: https://www.newyorksportsclubs.com/
Strict-Transport-Security: max-age=31536000; includeSubDomains; preload
X-Frame-Options: DENY
X-Content-Type-Options: nosniff
X-XSS-Protection: 1; mode=block
Referrer-Policy: origin
Referrer-Policy: no-referrer-when-downgrade

HTTP/1.1 200 OK
Date: Thu, 28 Aug 2025 14:56:47 GMT
Content-Type: text/html; charset=UTF-8
Transfer-Encoding: chunked
Connection: keep-alive
Server: nginx
Set-Cookie: PHPSESSID=ivc9ugpqk784anjje3d58bvmk6; path=/
Expires: Thu, 19 Nov 1981 08:52:00 GMT
Cache-Control: no-store, no-cache, must-revalidate
Pragma: no-cache
Link: ; rel="https://api.w.org/"
Link: ; rel="alternate"; title="JSON"; type="application/json"
Link: ; rel=shortlink
Strict-Transport-Security: max-age=31536000; includeSubDomains; preload
X-Frame-Options: DENY
X-Content-Type-Options: nosniff
X-XSS-Protection: 1; mode=block
Referrer-Policy: origin
Referrer-Policy: no-referrer-when-downgrade
Content-Encoding: gzip

iframe