Add robots and fix up sitemap.

This commit is contained in:
Michael Fabian 'Xaymar' Dirks
2024-09-07 13:55:17 +02:00
parent 1be1a7d451
commit d998a59fda
2 changed files with 16 additions and 4 deletions
+11
View File
@@ -1,4 +1,11 @@
---
layout: null
sitemap:
  exclude: true
---
User-agent: * User-agent: *
Sitemap: {{ "/sitemap.xml" | absolute_url }}
Disallow: /assets/ Disallow: /assets/
Disallow: /feed/ Disallow: /feed/
Disallow: /feed.xml Disallow: /feed.xml
@@ -13,12 +20,14 @@ User-agent: Applebot
User-agent: Applebot-Extended User-agent: Applebot-Extended
User-agent: Bytespider User-agent: Bytespider
User-agent: CCBot User-agent: CCBot
User-agent: ChatGPT
User-agent: ChatGPT-User User-agent: ChatGPT-User
User-agent: Claude-Web User-agent: Claude-Web
User-agent: ClaudeBot User-agent: ClaudeBot
User-agent: Diffbot User-agent: Diffbot
User-agent: FacebookBot User-agent: FacebookBot
User-agent: FriendlyCrawler User-agent: FriendlyCrawler
User-agent: GPT
User-agent: GPTBot User-agent: GPTBot
User-agent: Google-Extended User-agent: Google-Extended
User-agent: GoogleOther User-agent: GoogleOther
@@ -29,7 +38,9 @@ User-agent: ICC-Crawler
User-agent: ImagesiftBot User-agent: ImagesiftBot
User-agent: Meta-ExternalAgent User-agent: Meta-ExternalAgent
User-agent: Meta-ExternalFetcher User-agent: Meta-ExternalFetcher
User-agent: OpenAI
User-agent: OAI-SearchBot User-agent: OAI-SearchBot
User-agent: OAI-Bot
User-agent: PerplexityBot User-agent: PerplexityBot
User-agent: PetalBot User-agent: PetalBot
User-agent: Scrapy User-agent: Scrapy
+4 -3
View File
@@ -3,13 +3,13 @@ layout: null
sitemap: sitemap:
exclude: true exclude: true
--- ---
{% capture var %}
<?xml version="1.0" encoding="UTF-8"?> <?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
{% for post in site.posts %} {% for post in site.posts %}
{% unless post.published == false %} {% unless post.published == false %}
<url> <url>
<loc>{{ site.url }}{{ post.url }}</loc> <loc>{{ site.url | xml_escape }}{{ post.url | xml_escape }}</loc>
{% if post.sitemap.lastmod %} {% if post.sitemap.lastmod %}
<lastmod>{{ post.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod> <lastmod>{{ post.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
{% elsif post.date %} {% elsif post.date %}
@@ -41,7 +41,7 @@ sitemap:
{% endfor %} {% endfor %}
{% unless skip == true or page.sitemap.exclude == true %} {% unless skip == true or page.sitemap.exclude == true %}
<url> <url>
<loc>{{ site.url }}{{ page.url | remove: "index.html" }}</loc> <loc>{{ site.url | xml_escape }}{{ page.url | remove: "index.html" | xml_escape }}</loc>
{% if page.sitemap.lastmod %} {% if page.sitemap.lastmod %}
<lastmod>{{ page.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod> <lastmod>{{ page.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
{% elsif page.date %} {% elsif page.date %}
@@ -63,3 +63,4 @@ sitemap:
{% endunless %} {% endunless %}
{% endfor %} {% endfor %}
</urlset> </urlset>
{% endcapture %}{{ var | normalize_whitespace }}