#!/usr/bin/perl -w
#
#
#  rhautoimport
#
#  Copyright (C) 2009-2016 Christian Pointner <equinox@helsinki.at>
#
#  This file is part of rhautoimport.
#
#  rhautoimport is free software: you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation, either version 3 of the License, or
#  any later version.
#
#  rhautoimport is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with rhautoimport. If not, see <http://www.gnu.org/licenses/>.
#

# Imports the Democracy Now! episode of the broadcast day in question.
#
# Usage: an optional first argument is recognised:
#   last        - announces that no retry will follow a failure
#   noheadline  - skips the headlines feed, adds a generic note instead and
#                 uses a separate stat file
#
# Exit status: 0 on success, when there is nothing to do (no dropbox for the
# day, file already downloaded); 1 on any error.

use strict;
use Date::Calc;
use Time::localtime;
use XML::Feed;
use XML::Feed::Entry;
use XML::Feed::Content;
use XML::Feed::Enclosure;
use URI::URL;
use IO::Handle;
use IPC::Open3;

use lib '/usr/local/share/rhautoimport/';
use rhautoimport;

my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-dn.stat";
my $FILES_RSS_URL = "http://www.democracynow.org/podcast-stations.xml";
my $HEADLINES_RSS_URL = "http://www.democracynow.org/podcast.xml";
my $IGNORE_HEADLINE = 0;
my $RD_GROUP = "democracyn";
my $PV_ID = '111';

if($#ARGV >= 0 && $ARGV[0] eq 'last') {
  print "!!!This is the last attempt, there won't be a retry on error!!!\n"
}
if($#ARGV >= 0 && $ARGV[0] eq 'noheadline') {
  $IGNORE_HEADLINE = 1;
  $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-dn-noheadline.stat";
}

# Before noon the file of yesterday's broadcast is imported for today,
# from noon on the file of today's broadcast is imported for tomorrow.
my @today = Date::Calc::Today();
my @yesterday = Date::Calc::Add_Delta_Days($today[0], $today[1], $today[2], -1);
my @tomorrow = Date::Calc::Add_Delta_Days($today[0], $today[1], $today[2], 1);

my @broadcast_day = @yesterday;
my @import_day = @today;
if(localtime->hour >= 12) {
  print "It's past noon, assuming to import file from today\n";
  @broadcast_day = @today;
  @import_day = @tomorrow;
}

# Date::Calc numbers the days 1..7; the value 7 is mapped to 0 before it is
# compared with SHOWDOW below.
my $dow = Date::Calc::Day_of_Week(@import_day);
$dow = 0 unless $dow < 7;

print "day of original broadcast: " . Date::Calc::Date_to_Text(@broadcast_day) . "\n";
print "day of Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_day) . "\n";

my $show_id = -1;
my $show_title = "";

# An undefined first element followed by a defined second one is treated as
# an error, the second element being the message to print.
my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP);
if(!defined $allowed_dbs[0] && defined $allowed_dbs[1]) {
  print "$allowed_dbs[1]\n";
  exit 1;
}

for my $href ( @allowed_dbs ) {
  if($dow == $href->{'SHOWDOW'}) {
    $show_title = $href->{'SHOWTITLE'};
    $show_id = $href->{'SHOWID'};
    last;
  }
}

if($show_id < 0) {
  print "no dropbox for day in question\n";
  exit 0;
}

# $y is the date as used in the headline entry ids, $yc the date as it is
# embedded in the audio file names (no dash between month and day).
my $y = sprintf("%04d-%02d-%02d", $broadcast_day[0], $broadcast_day[1], $broadcast_day[2]);
my $yc = sprintf("%04d-%02d%02d", $broadcast_day[0], $broadcast_day[1], $broadcast_day[2]);

print "looking for files from date $y in RSS Feed\n";
print " -> $FILES_RSS_URL\n";

my $files_feed = rhautoimport::fetch_parse_rss($FILES_RSS_URL)
  or die "Error fetching feed: " . XML::Feed->errstr;

# Stays undefined until an enclosure for the broadcast day has been found.
my $uri;
my $file = "";
for my $entry ($files_feed->entries) {
  if($entry->enclosure && $entry->enclosure->type eq "audio/mpeg") {
    if($entry->enclosure->url =~ /^https?:\/\/.*\.democracynow\.org\/dn([0-9-]+)-1\.mp3$/) {
      next if($yc ne $1);

      $uri = URI::URL->new($entry->enclosure->url);
      my @path = $uri->path_components;

      # Read the name of the last imported file directly instead of
      # spawning a shell; a missing stat file simply means nothing has been
      # imported yet.
      my $current_file = "";
      if(open(my $fhr, '<', $STAT_FILE)) {
        local $/;
        my $content = <$fhr>;
        $current_file = $content if defined $content;
        close($fhr);
      }
      $current_file =~ s/\s+\z//;

      if($current_file eq $path[-1]) {
        print "Already downloaded file of day in question\n";
        exit 0;
      }
      $file = $path[-1];
      if(!rhautoimport::check_file_extension($file)) {
        print "\n\nThe extension of the matching file '". $file . "' seems to be wrong - manual import necessary!!!\n";
        exit 1;
      }
      last;
    }
  }
}

unless(defined $uri) {
  print "No Entry found from day in question or download error - ";
  if($#ARGV >= 0 && $ARGV[0] eq 'last') {
    print "giving up, manual import necessary!!!\n";
  } else {
    print "will retry later\n";
  }
  exit 1;
}

unless($IGNORE_HEADLINE) {
  print "\nlooking for headlines from date $y in RSS Feed\n";
  print " -> $HEADLINES_RSS_URL\n";

  my $headlines_feed = rhautoimport::fetch_parse_rss($HEADLINES_RSS_URL)
    or die "Error fetching feed: " . XML::Feed->errstr;

  for my $entry ($headlines_feed->entries) {
    if($entry->enclosure && $entry->enclosure->type eq "audio/mpeg") {
      my $sum_title = $entry->title;
      # The note consists of the entry summary followed by a link to the entry.
      my $sum_text = $entry->summary->body . "\n<br>\n<a href=\"" . $entry->link . "\">" . $entry->link . "</a>\n";
      if($entry->id =~ /tag:democracynow\.org,([0-9-]+):media\/mp3podcast\/[^\/]+/) {
        next if($y ne $1);

        print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";

        # The note is added twice, differing only in the last argument.
        # NOTE(review): the meaning of the trailing "1", 0/1/2 arguments is
        # defined by rhautoimport::pv_add_note - confirm there.
        rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, sprintf("%04d-%02d-%02d", @import_day), "1", 0);
        print "\n";
        rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, sprintf("%04d-%02d-%02d", @import_day), "1", 1);
        print "\n";

        last;
      }
    }
  }
} else {
  print "\nignoring headlines for they are not available by now\n";

  my $dow_string = Date::Calc::Day_of_Week_to_Text(Date::Calc::Day_of_Week(@broadcast_day));
  my $sum_title = sprintf("Democracy Now! %04d-%02d-%02d %s", @broadcast_day, $dow_string);
  my $sum_text = "";

  print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";

  # NOTE(review): this branch passes @broadcast_day whereas the headline
  # branch passes @import_day - verify that this difference is intended.
  rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, sprintf("%04d-%02d-%02d", @broadcast_day), "1", 2);
  print "\n";
}

print "will import '$uri' to show $show_id, $show_title\n\n";

# A true $ret is treated as failure; $log is printed in either case.
my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string);
if($ret) {
  print "\nImport Error:\n\n";
  print $log;
  exit 1;
}
print "\nImport Success:\n\n";
print $log;

# Remember the imported file name so that the next run can detect that the
# file has already been downloaded. The import itself has succeeded at this
# point, so a failure to write the stat file is reported but not fatal.
unlink($STAT_FILE);
if(open(my $fhs, '>', $STAT_FILE)) {
  print $fhs $file;
  close($fhs)
    or print "\nWarning: unable to close stat file '$STAT_FILE': $!\n";
} else {
  print "\nWarning: unable to write stat file '$STAT_FILE': $!\n";
}

exit 0;