1
0
Fork 0
mirror of https://git.sr.ht/~seirdy/seirdy.one synced 2024-12-30 20:02:09 +00:00
seirdy.one/linter-configs/htmltest.yml
2022-10-18 21:35:41 -07:00

60 lines
2.8 KiB
YAML

# What to scan: the "public" directory, skipping "search".
DirectoryPath: 'public'
IgnoreDirs:
- 'search'

# Document-level checks.
CheckFavicon: true
EnforceHTML5: true
EnforceHTTPS: true
# An empty alt makes the presentation role explicit; it is not a defect.
IgnoreAltMissing: true

# External-link fetching.
CacheExpires: '168h'  # seven days
ExternalTimeout: 180  # NOTE(review): presumably seconds -- confirm against the htmltest docs
HTTPConcurrencyLimit: 96
# Exceptions to EnforceHTTPS: http:// URLs that are allowed to stay on plain HTTP.
# NOTE(review): several entries are bare origins, so htmltest presumably treats
# them as patterns rather than exact URLs -- confirm against the htmltest docs.
IgnoreHTTPS:
# Private-network and loopback addresses.
- 'http://192.168.1'
- 'http://localhost:'
# Onion address.
- 'http://wgq3bd2kqoybhstp77i3wrzbfnsyd27wt34psaja4grqiezqircorkyd.onion'
# Third-party sites linked over plain HTTP.
- 'http://bettermotherfuckingwebsite.com/'
- 'http://dtrace.org/'
- 'http://emacspeak.sourceforge.net/'
- 'http://herpolhode.com/'
- 'http://io.netgarage.org/me/'
- 'http://linter.structured-data.org/'
- 'http://optipng.sourceforge.net/'
- 'http://renaissancechambara.jp/'
- 'http://techrights.org/'
- 'http://www.nathanmyhrvold.com/'
- 'http://www.tuxmachines.org/'
- 'http://xmlns.com/'
- 'http://nerdlistings.info/category/personalsites/'
CheckExternal: true
# URL patterns that htmltest skips. Entries are regular expressions (see the
# `^` anchor and the `(previous|next)` alternation below). They are written in
# single quotes so that regex backslashes are passed through literally.
IgnoreURLs:
- '../music.txt'
- '^gemini://'
- 'mailto:'
- 'git@git'
# Escape the dot: an unescaped "." would also match clearnet hosts whose name
# merely ends in "onion", such as http://theonion.com.
- 'http://[^/]*\.onion'
- 'https://archive.is'
- 'https://ogp.me/ns'
- 'https://seirdy.one/webmentions/'
- 'http://creativecommons.org/ns'
- 'https://seirdy.one/search/'
- 'https://nerdlistings.info/category/personalsites/'  # I reached out about the expired cert and mentioned the issue on the page.
- 'https://www.reddit.com/user/Seirdy'  # reddit doesn't like htmltest
# - "https://i.reddit.com/r/web_design/comments/k0dmpj/an_opinionated_list_of_best_practices_for_textual/gdmxy4u/"
- 'https://i.reddit.com'
- 'https://fediring.net/(previous|next)'  # redir
# - "https://forum.palemoon.org/viewtopic.php?f=1&t=25473" # manual check: blocks crawlers
- 'https://forum.palemoon.org/viewtopic.php'
- 'https://queue.acm.org/detail'  # manual check: blocks crawlers
- 'https://www.geocities.ws/jaup/jaup.htm'  # manual check: blocks crawlers
- 'https://plausible.io/blog/google-floc#'  # manual check: I block this domain
- 'https://twitter.com/'  # manual check: 404 for some reason, using curl works fine.
# - "https://bugs.debian.org/cgi-bin/bugreport.cgi?bug=830173" # manual check: 400 for some reason, using curl works fine.
- 'https://bugs.debian.org/cgi-bin/bugreport.cgi'
# - "https://forum.kuketz-blog.de/viewtopic.php?p=78202" # manual check: blocks crawlers
- 'https://forum.kuketz-blog.de/viewtopic.php'
- 'https://web.archive.org/'  # the wayback machine itself.
- 'https://webring.yesterweb.org/noJS/index.php'  # Seems to block htmltest; check manually
# NOTE(review): the "." before "id=" presumably stands in for a literal "?",
# which would otherwise act as a regex quantifier -- confirm before changing.
- 'https://gitweb.torproject.org/tor-browser.git/tree/browser/components/securitylevel/SecurityLevel.jsm.id=ffdf'  # Seems to block htmltest; check manually
- 'https://lnk.dk'  # blocks htmltest
- 'https://www.fastcompany.com/90759792/with-google-dominating-search-the-internet-needs-crawl-neutrality'  # blocks htmltest
# Output directory for htmltest, kept next to the other linter configs.
OutputDir: 'linter-configs/htmltest'