summaryrefslogtreecommitdiff
path: root/graveyard/rhautoimport-nw
diff options
context:
space:
mode:
authorChristian Pointner <equinox@helsinki.at>2019-01-30 13:36:34 (GMT)
committerChristian Pointner <equinox@helsinki.at>2019-01-30 13:36:34 (GMT)
commitd188f194c29c616b0a5366cbacd5eba052d121b1 (patch)
tree1fef26e92b4685746b6ba0319d0826bbd9a3cc90 /graveyard/rhautoimport-nw
parent01ff101609b75b59b55e9530073a74e83f527af6 (diff)
moved old importer to graveyard
Diffstat (limited to 'graveyard/rhautoimport-nw')
-rwxr-xr-xgraveyard/rhautoimport-nw216
1 files changed, 216 insertions, 0 deletions
diff --git a/graveyard/rhautoimport-nw b/graveyard/rhautoimport-nw
new file mode 100755
index 0000000..e24a998
--- /dev/null
+++ b/graveyard/rhautoimport-nw
@@ -0,0 +1,216 @@
+#!/usr/bin/perl -w
+#
+#
+# rhautoimport
+#
+# Copyright (C) 2009-2017 Christian Pointner <equinox@helsinki.at>
+#
+# This file is part of rhautoimport.
+#
+# rhautoimport is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# any later version.
+#
+# rhautoimport is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with rhautoimport. If not, see <http://www.gnu.org/licenses/>.
+#
+
+use strict;
+use Date::Calc;
+use XML::Feed;
+use XML::Feed::Entry;
+use XML::Feed::Content;
+use XML::Feed::Enclosure;
+use URI::URL;
+use HTML::Entities;
+
+use lib '/usr/local/share/rhautoimport/';
+use rhautoimport;
+
+# Show-specific settings for the netwatcher importer.
+my $STAT_FILE = "$ENV{'HOME'}/rhautoimport-nw.stat";  # name of the last imported file is kept here
+my $RSS_URL = "https://cba.fro.at/series/radio-netwatcher/feed";
+my $RD_GROUP = "netwatcher";  # group handed to rhautoimport::get_dropboxes
+my $PV_ID = '73';             # id handed to rhautoimport::pv_add_note
+my $TITLE="netwatcher";
+my $LAST_RUN = 0;             # becomes 1 when the first argument is 'last'
+
+# Enable XML::Feed's multiple-enclosure mode; the feed loop further down
+# iterates over $entry->enclosure as a list.
+$XML::Feed::MULTIPLE_ENCLOSURES=1;
+
+# All three standard streams carry UTF-8 text.
+for my $stream (\*STDIN, \*STDOUT, \*STDERR) {
+  binmode($stream, ":utf8");
+}
+
+# A first argument of 'last' marks this run as the final attempt.
+if(@ARGV && $ARGV[0] eq 'last') {
+  print "!!!This is the last attempt, there won't be a retry on error!!!\n";
+  $LAST_RUN = 1;
+}
+rhautoimport::report_title_and_last($TITLE, $LAST_RUN);
+
+
+# Fetch the dropboxes of this group. An undefined first element together
+# with a defined second element is treated as an error report: the second
+# element is printed as the message (presumably the helper's error
+# convention - confirm against rhautoimport::get_dropboxes).
+my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP);
+if(defined($allowed_dbs[1]) && !defined($allowed_dbs[0])) {
+  print "$allowed_dbs[1]\n";
+  exit 1;
+}
+
+# Exactly two dropboxes are expected: one for the regular broadcast and
+# one for the rebroadcast.
+unless(scalar(@allowed_dbs) == 2) {
+  print "found more or less than 2 Dropboxes for this group?!\n";
+  exit 1;
+}
+
+my $idx = 0;      # position of the regular broadcast dropbox
+my $idx_reb = 1;  # position of the rebroadcast dropbox
+my ($show_id, $show_title) =
+  ($allowed_dbs[$idx]->{'SHOWID'}, $allowed_dbs[$idx]->{'SHOWTITLE'});
+my ($show_id_reb, $show_title_reb) =
+  ($allowed_dbs[$idx_reb]->{'SHOWID'}, $allowed_dbs[$idx_reb]->{'SHOWTITLE'});
+
+
+# Work out the relevant dates:
+#   @import_date     - the Wednesday the show airs on Radio Helsinki; today
+#                      if today is a Wednesday, otherwise the next one
+#   @broadcast_day   - five days before @import_date (original broadcast)
+#   @import_date_reb - three days after @import_date (rebroadcast)
+# Date::Calc numbers weekdays 1 (Monday) to 7 (Sunday), so 3 is Wednesday.
+my @today = Date::Calc::Today();
+my $today_dow = Date::Calc::Day_of_Week(@today);
+
+my @import_date = @today;
+if($today_dow > 3) {
+  # this week's Wednesday has already passed, move on to next week
+  @import_date = Date::Calc::Add_Delta_Days(@import_date, 7);
+}
+if($today_dow != 3) {
+  # a business date is (year, week, day of week): pin the weekday to Wednesday
+  @import_date = Date::Calc::Standard_to_Business(@import_date);
+  $import_date[2] = 3;
+  @import_date = Date::Calc::Business_to_Standard(@import_date);
+}
+my @broadcast_day = Date::Calc::Add_Delta_Days(@import_date, -5);
+my @import_date_reb = Date::Calc::Add_Delta_Days(@import_date, 3);
+print "day of original broadcast: " . Date::Calc::Date_to_Text(@broadcast_day) . "\n";
+print "day of Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n";
+print "day of Radio Helsinki rebroadcast: " . Date::Calc::Date_to_Text(@import_date_reb) . "\n";
+
+my $id = sprintf("%04d-%02d-%02d", @import_date);
+my $bd = sprintf("%04d-%02d-%02d", @broadcast_day);
+# Pattern (matched against the upper-cased file name) for the file of the
+# original broadcast day. The format string is single-quoted on purpose:
+# inside double quotes "\." collapses to a bare "." and the extension dot
+# would match any character.
+my $bdfile = sprintf('NETWATCHER[-_]?%04d%02d%02d(.*)\.MP3', @broadcast_day);
+
+print "looking for files like '$bdfile' in RSS Feed\n";
+print " -> $RSS_URL\n";
+
+# Fetch the feed and search it for the audio enclosure whose file name
+# matches $bdfile. On success $uri, $file, $sum_title and $sum_text are
+# filled in; otherwise the script exits:
+#   exit 42 - the matching file is the one recorded in the stat file
+#   exit 1  - feed error, wrong file extension, or no matching entry
+my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL);
+unless ($result) {
+  print "Error fetching feed: $feed\n";
+  exit 1;
+}
+
+my $uri = "";
+my $file = "";
+my $sum_title = "";
+my $sum_text = "";
+
+my $i = 0;
+ENTRY: for my $entry ($feed->entries) {
+  $i++;
+  next unless $entry->enclosure;
+  my $j = 0;
+  for my $enclosure ($entry->enclosure) {
+    $j++;
+    # only audio enclosures are of interest; a missing type is skipped too
+    my $type = $enclosure->type;
+    next unless defined($type) && ($type eq "audio/mpeg" || $type eq "audio/ogg");
+
+    print "$i/$j: (" . $type . ", " . $enclosure->length . ") " . $enclosure->url . "\n";
+    # drop a "_cut" suffix in front of the extension
+    my $orig_uri = $enclosure->url;
+    if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) {
+      $orig_uri = $1 . $2;
+    }
+
+    my $candidate = URI::URL->new($orig_uri);
+    my @path = $candidate->path_components;
+    my $name = $path[-1];
+    next unless(uc($name) =~ $bdfile); # file not from correct day
+
+    $uri = $candidate;
+    $file = $name;
+
+    # Read the name of the previously imported file directly instead of
+    # shelling out to cat; a missing stat file simply means that nothing
+    # has been imported yet.
+    my $current_file = '';
+    if(open(my $fh_stat, '<', $STAT_FILE)) {
+      local $/;
+      $current_file = <$fh_stat>;
+      $current_file = '' unless defined $current_file;
+      close($fh_stat);
+      $current_file =~ s/[\r\n]+\z//;
+    }
+    if($current_file eq $file) {
+      print "Already downloaded file of today\n";
+      exit 42;
+    }
+    if(!rhautoimport::check_file_extension($file)) {
+      print "\n\nThe extension of the matching file '". $file . "' seems to be wrong - manual import necessary!!!\n";
+      print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+      exit 1;
+    }
+
+    $sum_title = decode_entities($entry->title);
+    $sum_text = decode_entities($entry->content->body);
+    print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";
+    last ENTRY;
+  }
+}
+if($uri eq "") {
+  print "No Entry found from $bd - ";
+  if($LAST_RUN) {
+    print "giving up, manual import necessary!!!\n";
+    print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+  } else {
+    print "will retry later\n";
+  }
+  exit 1;
+}
+
+# Import the file for the regular broadcast, then for the rebroadcast, and
+# add a PV note after each successful import.
+#   exit 1         - the regular import failed, nothing was imported
+#   $exit_code 23  - something after the regular import failed and needs
+#                    manual attention (no retry)
+my $exit_code = 0;
+print "\n\nwill import '$uri' to show $show_id, $show_title\n";
+my ($ret, $log, $keptfile_uri) = rhautoimport::import_uri($show_id, $uri->as_string, "keep");
+unless($ret == 0) {
+  print "\nImport Error:\n\n", $log;
+  print "\n\nNot adding PV note!!";
+  exit 1;
+}
+
+print "\nImport Success:\n\n", $log, "\n";
+
+# note for the regular broadcast; a failure here is reported but not fatal
+my $note_date = sprintf("%04d-%02d-%02d", @import_date);
+($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $note_date, "1");
+print $log;
+if($ret) {
+  print "\nIgnoring failed note import - manual intervention necessary!\n";
+  $exit_code = 23;
+}
+
+print "\n";
+
+# rebroadcast: re-use the kept file if the first import reported one,
+# otherwise import from the original URI once more
+if(defined($keptfile_uri)) {
+  print "re-using kept file '$keptfile_uri' to import rebroadcast $show_id_reb, $show_title_reb\n";
+  ($ret, $log) = rhautoimport::import_uri($show_id_reb, $keptfile_uri, "delete");
+} else {
+  print "rhimportd didn't provide a clue where to find the kept file... will import '$uri' to rebroadcast $show_id_reb, $show_title_reb\n";
+  ($ret, $log) = rhautoimport::import_uri($show_id_reb, $uri->as_string);
+}
+
+if($ret != 0) {
+  print "\nImport Error:\n\n", $log;
+  print "\n\nNot adding PV note!!";
+  print "\n\nSince the import for the regular broadcast went through we will not retry this import!!!";
+  print "\nYou need to manually import the rebroadcast.";
+  print "\n\n --> https://import.helsinki.at/shows/$show_id_reb\n";
+  $exit_code = 23;
+} else {
+  print "\nImport Success:\n\n", $log, "\n";
+
+  # note for the rebroadcast
+  my $note_date_reb = sprintf("%04d-%02d-%02d", @import_date_reb);
+  ($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $note_date_reb, "2");
+  print $log;
+  if($ret) {
+    print "\nIgnoring failed note import - manual intervention necessary!\n";
+    $exit_code = 23;
+  }
+}
+
+# Remember the imported file name so that the next run can detect that this
+# file has already been imported. A failure to write the stat file is
+# reported but does not change the exit code, since the import itself has
+# already been done at this point.
+unlink($STAT_FILE);
+if(open(my $fhs, '>', $STAT_FILE)) {
+  print $fhs "$file";
+  close($fhs) or print "\nWARNING: writing stat file '$STAT_FILE' failed: $!\n";
+} else {
+  print "\nWARNING: unable to open stat file '$STAT_FILE' for writing: $!\n";
+}
+
+exit $exit_code;