Add robots and fix up sitemap.
This commit is contained in:
+11
@@ -1,4 +1,11 @@
|
|||||||
|
---
|
||||||
|
layout: null
|
||||||
|
sitemap:
|
||||||
|
exclude: true
|
||||||
|
---
|
||||||
|
|
||||||
User-agent: *
|
User-agent: *
|
||||||
|
# Advertise the XML sitemap location to crawlers (must be an absolute URL).
Sitemap: {{ "/sitemap.xml" | absolute_url }}
|
||||||
Disallow: /assets/
|
Disallow: /assets/
|
||||||
Disallow: /feed/
|
Disallow: /feed/
|
||||||
Disallow: /feed.xml
|
Disallow: /feed.xml
|
||||||
@@ -13,12 +20,14 @@ User-agent: Applebot
|
|||||||
User-agent: Applebot-Extended
|
User-agent: Applebot-Extended
|
||||||
User-agent: Bytespider
|
User-agent: Bytespider
|
||||||
User-agent: CCBot
|
User-agent: CCBot
|
||||||
|
User-agent: ChatGPT
|
||||||
User-agent: ChatGPT-User
|
User-agent: ChatGPT-User
|
||||||
User-agent: Claude-Web
|
User-agent: Claude-Web
|
||||||
User-agent: ClaudeBot
|
User-agent: ClaudeBot
|
||||||
User-agent: Diffbot
|
User-agent: Diffbot
|
||||||
User-agent: FacebookBot
|
User-agent: FacebookBot
|
||||||
User-agent: FriendlyCrawler
|
User-agent: FriendlyCrawler
|
||||||
|
User-agent: GPT
|
||||||
User-agent: GPTBot
|
User-agent: GPTBot
|
||||||
User-agent: Google-Extended
|
User-agent: Google-Extended
|
||||||
User-agent: GoogleOther
|
User-agent: GoogleOther
|
||||||
@@ -29,7 +38,9 @@ User-agent: ICC-Crawler
|
|||||||
User-agent: ImagesiftBot
|
User-agent: ImagesiftBot
|
||||||
User-agent: Meta-ExternalAgent
|
User-agent: Meta-ExternalAgent
|
||||||
User-agent: Meta-ExternalFetcher
|
User-agent: Meta-ExternalFetcher
|
||||||
|
User-agent: OpenAI
|
||||||
User-agent: OAI-SearchBot
|
User-agent: OAI-SearchBot
|
||||||
|
User-agent: OAI-Bot
|
||||||
User-agent: PerplexityBot
|
User-agent: PerplexityBot
|
||||||
User-agent: PetalBot
|
User-agent: PetalBot
|
||||||
User-agent: Scrapy
|
User-agent: Scrapy
|
||||||
|
|||||||
+4
-3
@@ -3,13 +3,13 @@ layout: null
|
|||||||
sitemap:
|
sitemap:
|
||||||
exclude: true
|
exclude: true
|
||||||
---
|
---
|
||||||
|
{% capture var %}
|
||||||
<?xml version="1.0" encoding="UTF-8"?>
|
<?xml version="1.0" encoding="UTF-8"?>
|
||||||
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
|
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
|
||||||
{% for post in site.posts %}
|
{% for post in site.posts %}
|
||||||
{% unless post.published == false %}
|
{% unless post.published == false %}
|
||||||
<url>
|
<url>
|
||||||
<loc>{{ site.url }}{{ post.url }}</loc>
|
<loc>{{ site.url | xml_encode }}{{ post.url | xml_encode }}</loc>
|
||||||
{% if post.sitemap.lastmod %}
|
{% if post.sitemap.lastmod %}
|
||||||
<lastmod>{{ post.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
|
<lastmod>{{ post.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
|
||||||
{% elsif post.date %}
|
{% elsif post.date %}
|
||||||
@@ -41,7 +41,7 @@ sitemap:
|
|||||||
{% endfor %}
|
{% endfor %}
|
||||||
{% unless skip == true or page.sitemap.exclude == true %}
|
{% unless skip == true or page.sitemap.exclude == true %}
|
||||||
<url>
|
<url>
|
||||||
<loc>{{ site.url }}{{ page.url | remove: "index.html" }}</loc>
|
<loc>{{ site.url | xml_encode }}{{ page.url | remove: "index.html" | xml_encode }}</loc>
|
||||||
{% if page.sitemap.lastmod %}
|
{% if page.sitemap.lastmod %}
|
||||||
<lastmod>{{ page.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
|
<lastmod>{{ page.sitemap.lastmod | date: "%Y-%m-%d" }}</lastmod>
|
||||||
{% elsif page.date %}
|
{% elsif page.date %}
|
||||||
@@ -63,3 +63,4 @@ sitemap:
|
|||||||
{% endunless %}
|
{% endunless %}
|
||||||
{% endfor %}
|
{% endfor %}
|
||||||
</urlset>
|
</urlset>
|
||||||
|
{% endcapture %}{{ var | normalize_whitespace }}
|
||||||
|
|||||||
Reference in New Issue
Block a user