#!/usr/bin/perl
#
# Writes contextless_images.html: a short introduction followed (via
# dump_domains) by one entry per blacklisted image-blog domain, each with
# lookup links for reddit, digg, stumbleupon, wikipedia and alexa.

use strict;
use warnings;

# Ordered list of "domain => { options }" pairs.  It is deliberately an
# array rather than a hash so that output order matches declaration order.
# Recognised option keys:
#   comment     - free-form note written out after the entry
#   actual_link - URL to use for the main link instead of http://<domain>
my @domains = (
    "bestpicever.com" => {
        comment => <<'EOF',
effektz (Alex Weidmann, zen2design) was banned from digg, though they're
still active on reddit, del.icio.us, stumbleupon, ...
EOF
    },
    "pileofphotos.com"   => { comment => "Another effektz domain" },
    "bestpicsaround.com" => { comment => "Another effektz domain" },
    "uncommonpics.com"   => { comment => "Another effektz domain" },
    "lackcolor.com"      => { comment => "Another effektz domain" },
    "picsdown.com"       => {
        comment     => "Another effektz domain",
        actual_link => "http://www.google.com/search?hl=en&ie=UTF-8&oe=UTF-8&q=site:picsdown.com&btnG=Google+Search",
    },
    "knuttz.net"                     => {},
    "yadogg.com"                     => {},
    "amazingfiltered.blogspot.com"   => {},
    "static.iftk.com.br"             => {},
    "photo-of-the-day1.blogspot.com" => {
        comment => <<'EOF',
this site is apparently banned from reddit, since google says there were
actually 200+ stories.
EOF
    },
    "oomsa.com" => {},
);

# FOUT stays a bareword (package-level) handle on purpose: dump_domains
# prints to it, and code outside this section may print to or close it too.
# The three-argument form keeps the mode separate from the file name, and
# the die message now says what failed and why.
open FOUT, '>', 'contextless_images.html'
    or die "Cannot open contextless_images.html for writing: $!";

# NOTE(review): this introduction contains no markup; any HTML that belonged
# here (paragraph tags, a link to the Reddit Content Filter) is not
# recoverable from this copy -- confirm against the upstream original.
print FOUT <<"EOF";
These are blogs that consist mainly of linkjacked images, and almost never
contain enough context to actually learn more about the things in the image,
or to figure out the trustworthiness of the image's original author.
The solution to this problem? Obviously people should stop upmodding images
if they don't have adequate context.
Until that starts happening though, individual users can install the Reddit
Content Filter. It contains a site blacklist that will hide all stories from
the sites you specify.
EOF

# dump_domains()
#
# Writes one list item per entry of @domains to FOUT.  Takes no arguments
# and returns nothing useful; FOUT must already be open for writing.
#
# Each item links the domain name to its site (or to the entry's
# actual_link override), followed by links to reddit, digg, stumbleupon,
# wikipedia and alexa lookups for that domain.  If the entry has a comment,
# the comment text is written after the item.
#
# NOTE(review): the format string previously held a single %s while seven
# values were passed, so six URLs were silently dropped (and Perl 5.22+
# warns "Redundant argument in printf").  The anchor/list markup below is
# reconstructed from the argument order and the visible link labels --
# confirm against the intended page layout.
sub dump_domains {
    # Seven placeholders, in the same order as the values supplied below.
    my $item_format =
          qq{<li><a href="%s">%s</a> }
        . qq{(<a href="%s">reddit</a>, <a href="%s">digg</a>, }
        . qq{<a href="%s">stumbleupon</a>, <a href="%s">wikipedia</a>) }
        . qq{[<a href="%s">alexa</a>]\n};

    # Step by two: even indices hold the domain, odd indices its options.
    for (my $ctr = 0; $ctr < @domains; $ctr += 2) {
        my $domain = $domains[$ctr];
        my $data   = $domains[$ctr + 1] || {};

        printf FOUT $item_format,
            $data->{actual_link} || "http://$domain",
            $domain,
            "http://reddit.com/search?q=site%3A$domain",
            "http://search.yahoo.com/search?p=linkdomain%3A$domain+site%3Adigg.com+-inurl%3Aupcoming+-inurl%3Ausers&fr=yfp-t-471&toggle=1&cop=mss&ei=UTF-8",
            "http://www.google.com/search?hl=en&q=site%3Astumbleupon.com+inurl%3A$domain+inurl%3Aurl+-inurl%3As&btnG=Search&filter=0",
            "http://en.wikipedia.org/w/index.php?title=Special%3ALinksearch&target=*.$domain",
            "http://www.alexa.com/data/details/traffic_details?url=$domain";

        # Previously this branch printed only "\n", so the comment text
        # never reached the page.
        if ($data->{comment}) {
            print FOUT "<br>$data->{comment}\n";
        }
    }
}