Added robots.txt
This commit is contained in:
parent
2443addfdd
commit
17063143ab
@ -12,6 +12,14 @@ sites:
|
||||
- ./pages/*.md
|
||||
template_selections:
|
||||
article: templates.components.simple_article
|
||||
|
||||
robots_txt:
|
||||
title: robots.txt
|
||||
base_url: http://localhost:8000/robots.txt
|
||||
web_root: ./dist
|
||||
build_cache: ./site
|
||||
assets:
|
||||
- robots.txt
|
||||
|
||||
resume:
|
||||
title: Resume
|
||||
|
||||
@ -230,7 +230,7 @@ img {
|
||||
width: 50vw;
|
||||
}
|
||||
|
||||
li::marker {
|
||||
ul > li::marker {
|
||||
content: '⍟ ';
|
||||
/* TODO: Decide on a default li marker for the theme*/
|
||||
}
|
||||
@ -248,6 +248,11 @@ ul:has(> .blog-archive-li){
|
||||
border-bottom-style: solid;
|
||||
}
|
||||
|
||||
.blog-archive-li::marker{
|
||||
display: none;
|
||||
content: none;
|
||||
}
|
||||
|
||||
.blog-archive-li > time {
|
||||
float: right;
|
||||
}
|
||||
50
site/robots.txt
Normal file
50
site/robots.txt
Normal file
@ -0,0 +1,50 @@
|
||||
User-agent: *
|
||||
Crawl-delay: 5
|
||||
Content-Signal: ai-train=no, search=yes, ai-input=no
|
||||
Disallow: /assets/
|
||||
Disallow: /dogma-jimfinium/assets/
|
||||
Disallow: /*/assets/
|
||||
Disallow: /shepich_resume.pdf
|
||||
|
||||
|
||||
# Block AI bots and every other crawler named in this group (note: this includes Googlebot and Bingbot).
|
||||
User-agent: GPTBot
|
||||
User-agent: OAI-SearchBot
|
||||
User-agent: ChatGPT-User
|
||||
User-agent: anthropic-ai
|
||||
User-agent: ClaudeBot
|
||||
User-agent: claude-web
|
||||
User-agent: PerplexityBot
|
||||
User-agent: Perplexity-User
|
||||
User-agent: Google-Extended
|
||||
User-agent: Googlebot
|
||||
User-agent: Bingbot
|
||||
User-agent: Amazonbot
|
||||
User-agent: Applebot
|
||||
User-agent: Applebot-Extended
|
||||
User-agent: FacebookBot
|
||||
User-agent: meta-externalagent
|
||||
User-agent: LinkedInBot
|
||||
User-agent: Bytespider
|
||||
User-agent: DuckAssistBot
|
||||
User-agent: cohere-ai
|
||||
User-agent: AI2Bot
|
||||
User-agent: CCBot
|
||||
User-agent: Diffbot
|
||||
User-agent: omgili
|
||||
User-agent: Timpibot
|
||||
User-agent: YouBot
|
||||
User-agent: MistralAI-User
|
||||
User-agent: GoogleAgent-Mariner
|
||||
User-agent: Standard Chrome UA
|
||||
User-agent: No known UA
|
||||
User-agent: Knowatoa AI Search Console
|
||||
User-agent: Merkle robots.txt Tester
|
||||
User-agent: Block GPT model training
|
||||
User-agent: Allow ChatGPT user traffic
|
||||
User-agent: ChatGPT Atlas
|
||||
User-agent: OpenAI Operator
|
||||
User-agent: Google Project Mariner
|
||||
User-agent: Anthropic Computer Use
|
||||
User-agent: xAI Grok
|
||||
Disallow: /
|
||||
@ -3,6 +3,7 @@
|
||||
<meta charset="UTF-8">
|
||||
<meta name="viewport" content="width=device-width, initial-scale=1">
|
||||
<meta name="description" content="{site.description}">
|
||||
<meta name="robots" content="noindex" />
|
||||
<head>
|
||||
{templates.partials.default_css}
|
||||
{templates.partials.header}
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user