webarc/config.toml

73 lines
1.2 KiB
TOML
Raw Permalink Normal View History

2024-12-30 10:00:05 +01:00
# Links are rewritten so that they point back to the archive itself.
ROUTE_INTERNAL = true

# Routes that are missing get downloaded on demand.
DOWNLOAD_ON_DEMAND = true
2025-01-02 19:00:47 +01:00
[websites]
# Sites which won't work well can be blacklisted here.
# Entries are written as literal strings so pattern characters such as `^`
# never need escaping.
BLACKLIST_DOMAINS = [
    '^gitlab',  # All domains starting with gitlab
    'youtube',  # YouTube
]
2024-12-30 14:06:32 +01:00
2025-01-03 13:34:59 +01:00
# Example of a per-domain configuration entry.
[[websites.domains]]
domain = "example.com"     # the domain this entry applies to
blacklist_paths = ['/.*']  # blacklisted paths (regexes)
user_agent = "Safari"      # user agent

# Exclusion switches: set one to true to exclude that kind of content.
no_audio = false       # <audio> tags
no_video = false       # <video> tags
no_image = false       # <img> tags
no_css = false         # CSS
no_javascript = false  # JavaScript
no_fonts = false       # fonts
no_frames = false      # iframes
2025-01-02 19:00:47 +01:00
[ai]
# Ollama URL (enables vector search).
# NOTE(review): the value carries no scheme (e.g. http://) — confirm the
# consumer expects a bare host:port before changing it.
OLLAMA_URL = "127.0.0.1:11434"
2025-01-03 13:34:59 +01:00
# Website configuration entries.
# Each [[websites.domains]] header appends one more element to the
# `websites.domains` array.

[[websites.domains]]
domain = "developer.mozilla.org"
no_javascript = true

[[websites.domains]]
domain = "github.com"
no_javascript = true
2025-01-11 16:21:15 +01:00
[[websites.domains]]
domain = "en.wikipedia.org"
no_javascript = true

# Both Flutter documentation hosts exclude JavaScript and <video> tags.
[[websites.domains]]
domain = "api.flutter.dev"
no_javascript = true
no_video = true

[[websites.domains]]
domain = "docs.flutter.dev"
no_javascript = true
no_video = true