geminispace.info

Unnamed repository; edit this file 'description' to name the repository.
git clone git://code.clttr.info/geminispace.info.git
Log | Files | Refs | README | LICENSE

commit f7de0f8473861f62e2fccd13a1a29a2d73ebb098
parent 72c6ccbf81941ce81541bfbbf5eb8f03ebf77b61
Author: Natalie Pendragon <natpen@natpen.net>
Date:   Wed, 28 Oct 2020 06:55:18 -0400

[crawl] Add a few new exclusions

Diffstat:
M gus/crawl.py | 17 +++++++++++++++++
1 file changed, 17 insertions(+), 0 deletions(-)

diff --git a/gus/crawl.py b/gus/crawl.py
@@ -54,6 +54,7 @@ EXCLUDED_URL_PREFIXES = [
     "gemini://gus.guru/v/search?",
     "gemini://gus.guru/add-seed?",
     "gemini://gus.guru/backlinks?",
+    "gemini://gus.guru/threads",
 
     # Houston
     "gemini://houston.coder.town/search?",
@@ -70,6 +71,13 @@ EXCLUDED_URL_PREFIXES = [
     "gemini://acidic.website/cgi-bin/weather.tcl?",
 
     # Alex Schroeder's problematic stuff
+    "gemini://vault.transjovian.org/",
+    "gemini://transjovian.org/",
+    "gemini://alexschroeder.ch/",
+    "gemini://alexschroeder.ch:1967",
+    "gemini://communitywiki.org:1966/",
+    "gemini://communitywiki.org/",
+
     "gemini://alexschroeder.ch/image_external",
     "gemini://alexschroeder.ch/html/",
     "gemini://alexschroeder.ch/diff/",
@@ -127,6 +135,15 @@ EXCLUDED_URL_PREFIXES = [
     "gemini://gemini.susa.net/cgi-bin/search?",
     "gemini://gemini.susa.net/cgi-bin/twitter?",
     "gemini://gemini.susa.net/cgi-bin/vim-search?",
+
+    "gemini://pboyd.io/cgi-bin/guestbook.pl,",
+
+    "gemini://gemini.spam.works/textfiles/",
+    "gemini://gemini.spam.works/mirrors/textfiles/",
+
+    # this is a stream that never ends...
+    "gemini://gemini.thebackupbox.net/radio",
+
 ]
 
 EXCLUDED_URL_PATHS = [