--- comics/fetch.pl.new 2013/03/12 13:09:34 1.13 +++ comics/fetch.pl.new 2015/05/07 12:31:43 1.18 @@ -1,15 +1,33 @@ #!/usr/bin/perl -w +############################################################################### +# $Log: fetch.pl.new,v $ +# Revision 1.18 2015/05/07 12:31:43 nick +# Added favicon +# +# Revision 1.17 2015/02/19 14:56:10 nick +# Fixed a problem that forced everything to JPG. This would kill GIF animations, but would not display the gifs either because 'convert' appends an index number to the end of the file name for each frame of the GIF animation. I fixed this to maintain GIF compatibility as well as rewriting how the script fetches the size of the file. Additionally, I updated the configuration for Questionable Content to search for GIF or JPG, which is what triggered this entire update. +# +# Revision 1.16 2015/02/05 18:05:58 nick +# Changed the background and added a fancy title. +# +# Revision 1.15 2015/01/19 13:46:19 nick +# *** empty log message *** +# +############################################################################### + use strict; use File::Path; use Data::Dumper; use Pod::Usage; use Getopt::Long; +use Date::Calc qw/Date_to_Text_Long Today/; + ## ## Some default values ## -my $ver = q/$Id: fetch.pl.new,v 1.13 2013/03/12 13:09:34 nick Exp $/; +my $ver = '$Id: fetch.pl.new,v 1.18 2015/05/07 12:31:43 nick Exp $'; my $comicFile = "comics.conf"; my %comics = &readComicConfig ( $comicFile ); my %opts = &fetchOptions( ); @@ -22,7 +40,6 @@ my $indexDir = $baseDir . "/" . 
( $co my $USER_AGENT = "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.2.18) Gecko/20110628 Ubuntu/10.10 (maverick) Firefox/3.6.18"; my @days = qw/ Sunday Monday Tuesday Wednesday Thursday Friday Saturday /; - my $DATE=`date`; chomp $DATE; print STDOUT "Starting comic fetch at $DATE\n"; @@ -35,15 +52,22 @@ print STDOUT "Starting comic fetch at $D foreach my $comic ( sort keys %comics ) { next if ( $comic =~ m/config/ ); + if ( ( $dates{'day2'} eq "Sunday" ) && + ( $comics{$comic}{'sunday'} == 0 ) ) { print "Skipping.\n"; next; } $comics{$comic}{'error'} = &downloadComic ( \%comics, $comic, \%dates ); &writeComic ( \%comics, $comic, \%dates ); -} -print "Finding in $imageDir/*-$dates{'day2'}.jpg\n"; -foreach my $file ( glob( "$imageDir/*-$dates{'day2'}.jpg" ) ) -{ - my $size = `/usr/bin/identify $file`; - $size =~ s/.*\s(\d+)x\d+.*/$1/; + my $file = "$imageDir/$comic-$dates{'day2'}.$comics{$comic}{'ext'}"; + my $size = 0; + + my $cmd = "/usr/bin/identify -verbose $file|"; + open(IMG, $cmd) || die ("Can't open: $!\n"); + while(<IMG>) { + if ($_ =~ m/^\s+geometry:\s+(\d+)x\d+.*/i) { + $size = $1 if ( $size == 0); + } + } + close(IMG); system( "/usr/bin/convert -resize 640 $file $file" ) if ( $size > 640 ) @@ -92,15 +116,25 @@ sub readComicConfig ($$) { my %comicConfig = ( ); my %config = ( ); + my ($year, $mon, $day) =( localtime(time))[5,4,3]; + $year += 1900; + $mon = sprintf("%02d", ($mon + 1)); + $day = sprintf("%02d", $day); + open FILEN, "<$comicFile"; while (<FILEN>) { if ( ( $_ !~ m/^#/ ) && ( $_ =~ m/,.*,/) ){ + $_ =~ s/__YEAR__/$year/g; + $_ =~ s/__MON__/$mon/g; + $_ =~ s/__DAY__/$day/g; + my @res = split /,/, $_; $comicConfig{$res[0]}{'url'} = $res[1]; $comicConfig{$res[0]}{'search'} = $res[2]; $comicConfig{$res[0]}{'mode'} = $res[3]; $comicConfig{$res[0]}{'fullName'} = $res[4]; $comicConfig{$res[0]}{'ext'} = $res[5]; + $comicConfig{$res[0]}{'sunday'} = $res[6] || 1; $comicConfig{$res[0]}{'error'} = 0; } elsif ( $_ =~ m/(.*)\s+=\s+(.*)/ ) { @@ -131,7 +165,7 @@ sub 
writeComic ($$) { $comics->{$comic}{'url'}
-$comic-$date->{'day2'} +$comic-$date->{'day2'}

@@ -217,6 +251,7 @@ sub writeTitle ($$) { $date->{'mon2'} . $date->{'day2'} . "-" . $sd . ".html"; my $today = $days[$date->{'dow'}] . " " . $date->{'mon'} . "/" . $date->{'day'} . "/" . $date->{'year'}; + my $today_long = Date_to_Text_Long(Today()); open INDEX, ">$indexFile"; print INDEX < + Daily Comics for $today -

Daily Comics for $today

+
+ + + + + + EOF close (INDEX); } @@ -247,7 +289,8 @@ sub directDownload ($$) { my $cDir = $date->{'mon2'} . $date->{'year2'}; my $cDate = $date->{'day2'}; - my $cmd = "wget -q $file --referer=\"" . $comics->{$comic}{'url'} ."\" --user-agent=\"$USER_AGENT\" -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; + my $cmd = "wget -q $file --referer=\"" . $comics->{$comic}{'url'} ."\" --user-agent=\"$USER_AGENT\" -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; + return system($cmd); } @@ -278,10 +321,10 @@ sub indexDownload ($$) { ## Find the comic strip URL based on the specified regex in the search ## foreach my $line (@lines) { - if ( $line =~ m/$comics->{$comic}{'search'}/ ) { + if ( $line =~ m/$comics->{$comic}{'search'}/i ) { $comicLine = $1; chomp $comicLine; } - } + } ## ## Save the file to the appropriate directory @@ -292,7 +335,7 @@ sub indexDownload ($$) { if ( $comicLine ) { if ( $comicLine =~ m/(gif|jpg|png)/i ) { $comics->{$comic}{'ext'} = $1; } my $comicURL = ( $comicLine =~ m/http/ ) ? $comicLine : $mainURL . $comicLine; - my $cmd = "wget --user-agent=\"$USER_AGENT\" --referer=\"" . $comics->{$comic}{'url'} . "\" -q $comicURL -O - | /usr/bin/convert - jpeg:images/$cDir/$comic-$cDate.jpg"; + my $cmd = "wget --user-agent=\"$USER_AGENT\" --referer=\"" . $comics->{$comic}{'url'} . "\" -q $comicURL -O images/$cDir/$comic-$cDate.$comics->{$comic}{'ext'}"; system( $cmd ); return 0; }
$today_long