t* hacker news on gopher URI git clone git://git.codevoid.de/hn-gopher DIR Log DIR Files DIR Refs --- DIR commit 8623a7302f45460a20b8ff52923e419829e4f40b DIR parent 2ffdbea646f3d5028a12be096dc3e881a363a335 URI Author: Stefan Hagen <sh+git[at]codevoid[dot]de> Date: Wed, 1 Aug 2018 23:07:58 +0200 Extend blacklist Diffstat: M hn-scraper.pl | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) --- DIR diff --git a/hn-scraper.pl b/hn-scraper.pl t@@ -278,13 +278,16 @@ sub checkBlacklist { "twitter\.com", "phys\.org", "vimeo\.com", - "github\.com", + "\\/github\.com", "facebook\.com", "laptopmag\.com", "github\.com", "apple\.com", "mjg59\.dreamwidth\.org", - "scmp\.com" + "scmp\.com", + "www\.nature\.com", + "www\.reddit\.com" + "old\.reddit\.com" ); foreach my $item (@list) { if( $url =~ m/.*${item}/ ) { t@@ -339,8 +342,8 @@ sub dumpArticle { $msg = $f->parse($msg); # plausibility check. too small? - if(length($msg) < 500) { - print "Text < 500: $url\n"; + if(length($msg) <= 500) { + print "Text <= 500: $url\n"; return 1; }