--- comics/fetch.pl.new 2015/07/13 12:56:58 1.19
+++ comics/fetch.pl.new 2024/12/13 16:03:49 1.31
@@ -2,6 +2,50 @@
###############################################################################
# $Log: fetch.pl.new,v $
+# Revision 1.31 2024/12/13 16:03:49 nick
+# This adds the ability to specify a comic as a link only with a default splash image.
+#
+# Revision 1.30 2022/10/04 12:02:03 nick
+# Added --no-check-certificate for wget calls as arcamax was failing its cert check. Meh, whatever. It's just comics.
+#
+# Revision 1.29 2020/06/10 21:32:52 nick
+# Centered page
+#
+# Revision 1.28 2020/06/10 21:14:31 nick
+# Updated for w3 validation.
+#
+# Revision 1.27 2019/04/15 12:50:23 nick
+# The script was unable to handle html '&' and convert it, so I added that. I probably should see if there's a library or something that handles all those automagically but I just tossed a regex in there for now that does the trick.
+#
+# Revision 1.26 2018/04/22 14:03:54 nick
+# Changed the default for Sunday comics that was causing issues with some comics.
+#
+# Revision 1.25 2018/02/12 13:30:58 nick
+# Added an easier to compare date string to determine if the status json file was updated today and report if it wasn't.
+#
+# Revision 1.24 2018/02/06 14:31:06 nick
+# A status report is now generated in JSON that can easily be scanned so that
+# I can be alerted when there are failures that I miss if I don't read the
+# comics that day.
+#
+# Revision 1.23 2018/01/26 13:05:27 nick
+# Added a new config option to remove all newline from the resulting index.html
+# file. This allows for easier parsing for certain comics. I then updated
+# the URLs to search for and enabled the newline removal for a handful
+# of uComics.
+#
+# I believe I've also properly fixed the Comic Config version displayed on
+# the webpage itself.
+#
+# Revision 1.22 2017/12/05 13:37:40 nick
+# Added the CVS config version to the outpuit.
+#
+# Revision 1.21 2015/10/26 14:25:40 nick
+# Fixed a bug that was improperly including the day of week string preventing the weekend comics from fetching proproperly.
+#
+# Revision 1.20 2015/10/22 12:58:44 nick
+# Added the ability for Sunday only comics. Stonesoup is no longer weekdays, this has been added to Sunday only. I also added Foxtrot Classics for weekdays and Foxtrot for Sundays.
+#
# Revision 1.19 2015/07/13 12:56:58 nick
# Added Sally Forth and Pearls Before Swine. Adding Sally Forth required a change in the 'wget' command for fetching the index file to include 'user-agent' and 'referer'.
#
@@ -24,14 +68,19 @@ use File::Path;
use Data::Dumper;
use Pod::Usage;
use Getopt::Long;
+use JSON::Create 'create_json';
+use Date::Calc qw/Date_to_Text_Long Today Day_of_Week Day_of_Week_to_Text/;
+use Data::Dumper;
-use Date::Calc qw/Date_to_Text_Long Today/;
+print("Running");
##
## Some default values
##
-my $ver = '$Id: fetch.pl.new,v 1.19 2015/07/13 12:56:58 nick Exp $';
+my $ver = '$Id: fetch.pl.new,v 1.31 2024/12/13 16:03:49 nick Exp $';
my $comicFile = "comics.conf";
+my $comicConfigVer = "Unknown";
+my $reportFile = "/home/httpd/html/daily/comics/status_report.json";
my %comics = &readComicConfig ( $comicFile );
my %opts = &fetchOptions( );
my $days_ago = $opts{'days'} || 0;
@@ -54,33 +103,53 @@ print STDOUT "Starting comic fetch at $D
&writeTitle ( \%dates );
foreach my $comic ( sort keys %comics ) {
+
+ print("Checking Comic $comic\n");
+
+ ## Skip if this is Sunday and the comic is weekdays only
next if ( $comic =~ m/config/ );
- if ( ( $dates{'day2'} eq "Sunday" ) &&
- ( $comics{$comic}{'sunday'} == 0 ) ) { print "Skipping.\n"; next; }
+ if (($dates{'wday'} eq "Sunday") &&
+ ($comics{$comic}{'not_sunday'} == 1)) {
+ print "Skipping '$comic'; Weekdays only.\n";
+ next;
+ }
+
+ ## Skip if Sunday only comic and it's not Sunday.
+ if (($dates{'wday'} ne "Sunday") &&
+ ($comics{$comic}{'sunday_only'} == 1)) {
+ print "Skipping '$comic' ($comics{$comic}{'sunday_only'}); Sunday only.\n";
+ next
+ }
+
$comics{$comic}{'error'} = &downloadComic ( \%comics, $comic, \%dates );
&writeComic ( \%comics, $comic, \%dates );
my $file = "$imageDir/$comic-$dates{'day2'}.$comics{$comic}{'ext'}";
my $size = 0;
- my $cmd = "/usr/bin/identify -verbose $file|";
- open(IMG, $cmd) || die ("Can't open: $!\n");
- while() {
- if ($_ =~ m/^\s+geometry:\s+(\d+)x\d+.*/i) {
- $size = $1 if ( $size == 0);
- }
- }
- close(IMG);
-
-
- system( "/usr/bin/convert -resize 640 $file $file" )
- if ( $size > 640 )
+ ## Resize downloaded images
+ if($comics{$comic}{'mode'} != 3) {
+ my $cmd = "/usr/bin/identify -verbose $file|";
+ open(IMG, $cmd) || die ("Can't open: $!\n");
+ while() {
+ if ($_ =~ m/^\s+geometry:\s+(\d+)x\d+.*/i) {
+ $size = $1 if ( $size == 0);
+ }
+ }
+ close(IMG);
+
+ system( "/usr/bin/convert -resize 800 $file $file" )
+ if ( $size > 800 )
+ }
}
## &writeMainIndex ( \%dates );
&writeFooter( \%dates );
+print STDOUT "Status written to $reportFile.\n"
+ if (&writeStatusReportJSON(\%comics, $reportFile));
+
$DATE=`date`; chomp( $DATE );
print STDOUT "Completed comic fetch at $DATE\n";
@@ -108,6 +177,10 @@ sub downloadComic ($$) {
return directDownload ( \%comics, $comic, $date );
last SWITCH;
}
+ if ( $comics->{$comic}{'mode'} eq 3 ) {
+ return 0;
+ last SWITCH;
+ }
}
return "ERROR: Unknown download method specified for $comics->{$comic}{'fullName'}.";
@@ -127,6 +200,10 @@ sub readComicConfig ($$) {
open FILEN, "<$comicFile";
while (
+Generated on: $sysDate
$comics->{$comic}{'fullName'}
-
+
$comics->{$comic}{'url'}
@@ -220,14 +345,13 @@ sub writeFooter {
print INDEX <
+EOF
+ if ( $comics->{$comic}{'mode'} == 3 ) {
+ print("Mode 3\n");
+ $content .= <
-Version: $ver
-CVS: http://demandred.dyndns.org/cgi-bin/cvsweb/comics/
-
+Version: $ver
+Config Version: $comicConfigVer
+CVS: http://demandred.dyndns.org/cgi-bin/cvsweb/comics/
+
-
-
|
@@ -264,19 +388,15 @@ sub writeTitle ($$) {
- - + +