# Copyright (c) 1997- The Swedish Internet Foundation.
# All rights reserved.
# The information obtained through searches, or otherwise, is protected
# by the Swedish Copyright Act (1960:729) and international conventions.
# It is also subject to database protection according to the Swedish
# Copyright Act.
# Any use of this material to target advertising or
# similar activities is forbidden and will be prosecuted.
# If any of the information below is transferred to a third
# party, it must be done in its entirety. This server must
# not be used as a backend for a search engine.
# Result of search for registered domain names under
# the .se top level domain.
# This whois printout is printed with UTF-8 encoding.
#
state: active
domain: tv4.se
holder: CSC03-90958280
created: 1994-08-19
modified: 2025-12-22
expires: 2026-12-31
transferred: 2016-02-15
nserver: ns-1757.awsdns-27.co.uk
nserver: ns-1067.awsdns-05.org
nserver: ns-1017.awsdns-63.net
nserver: ns-228.awsdns-28.com
dnssec: unsigned delegation
registry-lock: locked
status: serverUpdateProhibited
status: serverDeleteProhibited
status: serverTransferProhibited
registrar: CSC Corp Domains
# =========================
# 1) General Site Rules
# =========================
User-agent: *
Disallow: /rss/kb
Disallow: /health
Disallow: /8cbf4ebb-4570-4351-a0ad-45b19148e4de
# =========================
# 2) Explicitly Allowed Agents
# =========================
# OpenAI Search Bot is explicitly allowed to access all content
User-agent: OAI-SearchBot
Disallow:
# =========================
# 3) AI / LLM-Related Crawlers (Disallowed)
# =========================
# Common Crawl robot, the resulting dataset is often used for LLM training.
User-agent: CCBot
Disallow: /
# ChatGPT-User fetches pages on behalf of ChatGPT users (user-initiated requests, not automatic crawling).
User-agent: ChatGPT-User
Disallow: /
# GPTBot is OpenAI's web crawler; content it collects may be used to train OpenAI's models.
User-agent: GPTBot
Disallow: /
# Google-Extended is a control token (not a separate crawler) governing use of content for Gemini (formerly Bard) and Vertex AI models.
User-agent: Google-Extended
Disallow: /
# Used by webz.io; their datasets are frequently used to train LLMs.
User-agent: omgili
Disallow: /
# Used by webz.io; their datasets are frequently used to train LLMs.
User-agent: omgilibot
Disallow: /
# FacebookBot crawls public web pages, which can feed Facebook’s LLM efforts.
User-agent: FacebookBot
Disallow: /
# Amazonbot is used to train Amazon services such as Alexa.
User-agent: Amazonbot
Disallow: /
# Bytespider is ByteDance's bot (TikTok); may not respect robots.txt but is known for AI/ML data gathering.
User-agent: Bytespider
Disallow: /
# Robot used to improve Anthropic AI LLMs.
User-agent: anthropic-ai
Disallow: /
# Additional known AI/LLM bots
User-agent: AI2Bot
Disallow: /
User-agent: Applebot-Extended
Disallow: /
User-agent: Claude-Web
Disallow: /
User-agent: ClaudeBot
Disallow: /
User-agent: cohere-ai
Disallow: /
User-agent: cohere-training-data-crawler
Disallow: /
User-agent: Diffbot
Disallow: /
User-agent: Kangaroo Bot
Disallow: /
User-agent: Meta-ExternalAgent
Disallow: /
User-agent: PanguBot
Disallow: /
User-agent: Timpibot
Disallow: /
User-agent: Webzio-Extended
Disallow: /
User-agent: grapeshot
Disallow: /
# =========================
# Sitemap
# =========================
Sitemap: https://www.tv4.se/sitemap.xml
| Konum | İfade etmek | Sayfa | Snippet |
|---|---|---|---|
| 1 | /usa | ||
| 43 | / |