it* hacker news on gopher Err codevoid.de 70 i Err codevoid.de 70 hgit clone git://git.codevoid.de/hn-gopher URL:git://git.codevoid.de/hn-gopher codevoid.de 70 1Log /git/hn-gopher/log.gph codevoid.de 70 1Files /git/hn-gopher/files.gph codevoid.de 70 1Refs /git/hn-gopher/refs.gph codevoid.de 70 i--- Err codevoid.de 70 1commit 8623a7302f45460a20b8ff52923e419829e4f40b /git/hn-gopher/commit/8623a7302f45460a20b8ff52923e419829e4f40b.gph codevoid.de 70 1parent 2ffdbea646f3d5028a12be096dc3e881a363a335 /git/hn-gopher/commit/2ffdbea646f3d5028a12be096dc3e881a363a335.gph codevoid.de 70 hAuthor: Stefan Hagen URL:mailto:sh+git[at]codevoid[dot]de codevoid.de 70 iDate: Wed, 1 Aug 2018 23:07:58 +0200 Err codevoid.de 70 i Err codevoid.de 70 iExtend blacklist Err codevoid.de 70 i Err codevoid.de 70 iDiffstat: Err codevoid.de 70 i M hn-scraper.pl | 11 +++++++---- Err codevoid.de 70 i Err codevoid.de 70 i1 file changed, 7 insertions(+), 4 deletions(-) Err codevoid.de 70 i--- Err codevoid.de 70 1diff --git a/hn-scraper.pl b/hn-scraper.pl /git/hn-gopher/file/hn-scraper.pl.gph codevoid.de 70 it@@ -278,13 +278,16 @@ sub checkBlacklist { Err codevoid.de 70 i "twitter\.com", Err codevoid.de 70 i "phys\.org", Err codevoid.de 70 i "vimeo\.com", Err codevoid.de 70 i- "github\.com", Err codevoid.de 70 i+ "\\/github\.com", Err codevoid.de 70 i "facebook\.com", Err codevoid.de 70 i "laptopmag\.com", Err codevoid.de 70 i "github\.com", Err codevoid.de 70 i "apple\.com", Err codevoid.de 70 i "mjg59\.dreamwidth\.org", Err codevoid.de 70 i- "scmp\.com" Err codevoid.de 70 i+ "scmp\.com", Err codevoid.de 70 i+ "www\.nature\.com", Err codevoid.de 70 i+ "www\.reddit\.com" Err codevoid.de 70 i+ "old\.reddit\.com" Err codevoid.de 70 i ); Err codevoid.de 70 i foreach my $item (@list) { Err codevoid.de 70 i if( $url =~ m/.*${item}/ ) { Err codevoid.de 70 it@@ -339,8 +342,8 @@ sub dumpArticle { Err codevoid.de 70 i $msg = $f->parse($msg); Err codevoid.de 70 i Err codevoid.de 70 i # plausibility check. too small? Err codevoid.de 70 i- if(length($msg) < 500) { Err codevoid.de 70 i- print "Text < 500: $url\n"; Err codevoid.de 70 i+ if(length($msg) <= 500) { Err codevoid.de 70 i+ print "Text <= 500: $url\n"; Err codevoid.de 70 i return 1; Err codevoid.de 70 i } Err codevoid.de 70 i Err codevoid.de 70 .