Vejr.tv2.dk has a robots.txt file. The HTTP response code is 200.
Robots size is small. It is about 185 kb and 56 rows.

Robots.txt for User-Agent=* contains no allow directives: only disallow directives and a crawl-delay of 10.

The Host directive is not present for the domain vejr.tv2.dk in the robots.txt file.
Array
(
    [*] => Array
        (
            [crawl-delay] => 10
            [disallow] => Array
                (
                    [0] => /includes/
                    [1] => /misc/
                    [2] => /modules/
                    [3] => /profiles/
                    [4] => /scripts/
                    [5] => /themes/
                    [6] => /CHANGELOG.txt
                    [7] => /cron.php
                    [8] => /INSTALL.mysql.txt
                    [9] => /INSTALL.pgsql.txt
                    [10] => /INSTALL.sqlite.txt
                    [11] => /install.php
                    [12] => /INSTALL.txt
                    [13] => /LICENSE.txt
                    [14] => /MAINTAINERS.txt
                    [15] => /update.php
                    [16] => /UPGRADE.txt
                    [17] => /xmlrpc.php
                    [18] => /admin/
                    [19] => /comment/reply/
                    [20] => /filter/tips/
                    [21] => /node/add/
                    [22] => /search/
                    [23] => /user/register/
                    [24] => /user/password/
                    [25] => /user/login/
                    [26] => /user/logout/
                    [27] => /?q=admin/
                    [28] => /?q=comment/reply/
                    [29] => /?q=filter/tips/
                    [30] => /?q=node/add/
                    [31] => /?q=search/
                    [32] => /?q=user/password/
                    [33] => /?q=user/register/
                    [34] => /?q=user/login/
                    [35] => /?q=user/logout/
                )

        )

)
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html

User-agent: *
Crawl-delay: 10
# Directories
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /themes/
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /INSTALL.sqlite.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /xmlrpc.php
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
Disallow: /filter/tips/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
Disallow: /user/logout/
# Paths (no clean URLs)
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=filter/tips/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
Disallow: /?q=user/logout/
  • code 301 http://vejr.tv2.dk/robots.txt
  • code 200 https://vejr.tv2.dk/robots.txt