--- comics/fetch.pl.new 2015/02/05 18:05:58 1.16 +++ comics/fetch.pl.new 2015/10/26 14:25:40 1.21 @@ -2,6 +2,21 @@ ############################################################################### # $Log: fetch.pl.new,v $ +# Revision 1.21 2015/10/26 14:25:40 nick +# Fixed a bug that was improperly including the day of week string preventing the weekend comics from fetching properly. +# +# Revision 1.20 2015/10/22 12:58:44 nick +# Added the ability for Sunday only comics. Stonesoup is no longer weekdays, this has been added to Sunday only. I also added Foxtrot Classics for weekdays and Foxtrot for Sundays. +# +# Revision 1.19 2015/07/13 12:56:58 nick +# Added Sally Forth and Pearls Before Swine. Adding Sally Forth required a change in the 'wget' command for fetching the index file to include 'user-agent' and 'referer'. +# +# Revision 1.18 2015/05/07 12:31:43 nick +# Added favicon +# +# Revision 1.17 2015/02/19 14:56:10 nick +# Fixed a problem that forced everything to JPG. This would kill GIF animations, but would not display the gifs either because 'convert' appends an index number to the end of the file name for each frame of the GIF animation. I fixed this to maintain GIF compatibility as well as rewriting how the script fetches the size of the file. Additionally, I updated the configuration for Questionable Content to search for GIF or JPG, which is what triggered this entire update. +# # Revision 1.16 2015/02/05 18:05:58 nick # Changed the background and added a fancy title. 
# @@ -16,12 +31,12 @@ use Data::Dumper; use Pod::Usage; use Getopt::Long; -use Date::Calc qw/Date_to_Text_Long Today/; +use Date::Calc qw/Date_to_Text_Long Today Day_of_Week Day_of_Week_to_Text/; ## ## Some default values ## -my $ver = '$Id: fetch.pl.new,v 1.16 2015/02/05 18:05:58 nick Exp $'; +my $ver = '$Id: fetch.pl.new,v 1.21 2015/10/26 14:25:40 nick Exp $'; my $comicFile = "comics.conf"; my %comics = &readComicConfig ( $comicFile ); my %opts = &fetchOptions( ); @@ -45,18 +60,37 @@ print STDOUT "Starting comic fetch at $D &writeTitle ( \%dates ); foreach my $comic ( sort keys %comics ) { + + ## Skip if this is Sunday and the comic is weekdays only next if ( $comic =~ m/config/ ); - if ( ( $dates{'day2'} eq "Sunday" ) && - ( $comics{$comic}{'sunday'} == 0 ) ) { print "Skipping.\n"; next; } + if (($dates{'wday'} eq "Sunday") && + ($comics{$comic}{'sunday'} == 0)) { + print "Skipping '$comic'; Weekdays only.\n"; + next; + } + + ## Skip if Sunday only comic and it's not Sunday. + if (($dates{'wday'} ne "Sunday") && + ($comics{$comic}{'sunday_only'} == 1)) { + print "Skipping '$comic' ($comics{$comic}{'sunday_only'}); Sunday only.\n"; + next + } + $comics{$comic}{'error'} = &downloadComic ( \%comics, $comic, \%dates ); &writeComic ( \%comics, $comic, \%dates ); -} -print "Finding in $imageDir/*-$dates{'day2'}.jpg\n"; -foreach my $file ( glob( "$imageDir/*-$dates{'day2'}.jpg" ) ) -{ - my $size = `/usr/bin/identify $file`; - $size =~ s/.*\s(\d+)x\d+.*/$1/; + my $file = "$imageDir/$comic-$dates{'day2'}.$comics{$comic}{'ext'}"; + my $size = 0; + + my $cmd = "/usr/bin/identify -verbose $file|"; + open(IMG, $cmd) || die ("Can't open: $!\n"); + while() { + if ($_ =~ m/^\s+geometry:\s+(\d+)x\d+.*/i) { + $size = $1 if ( $size == 0); + } + } + close(IMG); + system( "/usr/bin/convert -resize 640 $file $file" ) if ( $size > 640 ) @@ -123,7 +157,8 @@ sub readComicConfig ($$) { $comicConfig{$res[0]}{'mode'} = $res[3]; $comicConfig{$res[0]}{'fullName'} = $res[4]; 
$comicConfig{$res[0]}{'ext'} = $res[5]; - $comicConfig{$res[0]}{'sunday'} = $res[6] || 1; + $comicConfig{$res[0]}{'sunday'} = sprintf("%d", $res[6] || 1); + $comicConfig{$res[0]}{'sunday_only'} = sprintf("%d", $res[7] || 0); $comicConfig{$res[0]}{'error'} = 0; } elsif ( $_ =~ m/(.*)\s+=\s+(.*)/ ) { @@ -154,7 +189,7 @@ sub writeComic ($$) { $comics->{$comic}{'url'}
-$comic-$date->{'day2'} +$comic-$date->{'day2'}

@@ -250,6 +285,7 @@ sub writeTitle ($$) { + Daily Comics for $today @@ -277,7 +313,7 @@ sub directDownload ($$) { my $cDir = $date->{'mon2'} . $date->{'year2'}; my $cDate = $date->{'day2'}; - my $cmd = "wget -q $file --referer=\"" . $comics->{$comic}{'url'} ."\" --user-agent=\"$USER_AGENT\" -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; + my $cmd = "wget -q $file --referer=\"" . $comics->{$comic}{'url'} ."\" --user-agent=\"$USER_AGENT\" -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; return system($cmd); } @@ -289,7 +325,10 @@ sub indexDownload ($$) { my ( @lines, $comicLine, $mainURL ); my $comicIndex = "indexes/index.$comic"; - `wget -q $comics->{$comic}{'url'} -O $comicIndex`; + my $wget_cmd = "wget -q --referer=\"$comics->{$comic}{'url'}\" " . + "--user-agent=\"$USER_AGENT\" " . + "$comics->{$comic}{'url'} -O $comicIndex"; + system($wget_cmd); if ( ! open FILEN, "<$comicIndex" ) { return "ERROR: Can't open index file for " . $comics->{$comic}{'fullName'} . @@ -309,10 +348,10 @@ sub indexDownload ($$) { ## Find the comic strip URL based on the specified regex in the search ## foreach my $line (@lines) { - if ( $line =~ m/$comics->{$comic}{'search'}/ ) { + if ( $line =~ m/$comics->{$comic}{'search'}/i ) { $comicLine = $1; chomp $comicLine; } - } + } ## ## Save the file to the appropriate directory @@ -323,7 +362,7 @@ sub indexDownload ($$) { if ( $comicLine ) { if ( $comicLine =~ m/(gif|jpg|png)/i ) { $comics->{$comic}{'ext'} = $1; } my $comicURL = ( $comicLine =~ m/http/ ) ? $comicLine : $mainURL . $comicLine; - my $cmd = "wget --user-agent=\"$USER_AGENT\" --referer=\"" . $comics->{$comic}{'url'} . "\" -q $comicURL -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; + my $cmd = "wget --user-agent=\"$USER_AGENT\" --referer=\"" . $comics->{$comic}{'url'} . 
"\" -q $comicURL -O images/$cDir/$comic-$cDate.$comics->{$comic}{'ext'}"; system( $cmd ); return 0; } @@ -363,6 +402,8 @@ sub fetchDates () { $dates{'day2'} = ( $dates{'day'} < 10 ) ? "0" . $dates{'day'} : $dates{'day'}; $dates{'mon'}++; $dates{'mon2'} = ( $dates{'mon'} < 10 ) ? "0".$dates{'mon'} : $dates{'mon'}; + my @days = qw/ Sunday Monday Tuesday Wednesday Thursday Friday Saturday /; + $dates{'wday'} = $days[$dates{'dow'}]; return %dates; }