summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorChristian Pointner <equinox@helsinki.at>2020-06-17 15:58:05 (GMT)
committerChristian Pointner <equinox@helsinki.at>2020-06-17 15:58:05 (GMT)
commit52920b8ef8b6e49308329f74f6afac1de3bb895a (patch)
treebb47719d192845f227fe6cebf53397195a5c0a9b
parent97043f5c4a8f65262f73f839d5ac8c85209e5d50 (diff)
added importer for crossing borders
-rw-r--r--INFO16
-rw-r--r--Makefile2
-rw-r--r--TODO8
-rw-r--r--debian/changelog6
-rw-r--r--graveyard/INFO8
-rwxr-xr-xrhautoimport-ba2
-rwxr-xr-xrhautoimport-cb208
7 files changed, 232 insertions, 18 deletions
diff --git a/INFO b/INFO
index 6ba830b..862bd68 100644
--- a/INFO
+++ b/INFO
@@ -124,14 +124,6 @@
Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
RH: 4wöchentlich, Woche 2, Dienstag, 13:00-14:00
-- (ab) A Year Abroad:
- https://cba.fro.at/series/a-year-abroad/feed
-
- Original: vierter Freitag im Monat
- Upload: ein paar tage davor, gelegentlich erst ein paar Tage später...
- Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
- RH: 4wöchentlich, Woche 3, Freitag, 15:00-16:00
-
- (po) Panoptikum Bildung:
https://cba.fro.at/series/panoptikum-bildung/feed
@@ -147,3 +139,11 @@
Upload: "wir versuchen zwischen Montag und Mittwoch hochzuladen"
Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
RH: 4wöchentlich, Woche 2, Freitag, 16:30-17:00
+
+- (cb) Crossing Borders
+ https://cba.fro.at/series/crossing-borders/feed
+
+ Original: erster Donnerstag im Monat
+ Upload: meistens 1-2 Tage später, (Ausreisser im Mai und Juni 2020 - aber erst 5 Termine insgesamt)
+ Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
+ RH: 4wöchentlich, Woche 1, Sonntag, 17:00-18:00
diff --git a/Makefile b/Makefile
index 0241016..7e3526e 100644
--- a/Makefile
+++ b/Makefile
@@ -26,7 +26,7 @@ endif
.PHONY: clean distclean
EXECUTABLE := rhautoimport
-IMPORTER := ba btl dm dn dv ek eu gd lr oi po rs ra tr wr xy
+IMPORTER := ba btl cb dm dn dv ek eu gd lr oi po rs ra tr wr xy
EXECUTABLES := $(IMPORTER:%=$(EXECUTABLE)-%)
all: $(EXECUTABLE)
diff --git a/TODO b/TODO
index b434d5f..eae7e83 100644
--- a/TODO
+++ b/TODO
@@ -23,11 +23,3 @@
Upload: Teilweise ein Monat später - batch upload...
Such-Kriterium: fortlaufende Nummer im Titel?
RH: 2wöchentlich, Woche 2/4, Dienstag, 02:00-03:00
-
-- (cb) Crossing Borders
- https://cba.fro.at/series/crossing-borders/feed
-
- Original: erster Donnerstag im Monat
- Upload: meistens 1-2 Tage später, (Ausreisser im Mai aber erst 4 Sendungen insgesamt)
- Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
- RH: 4wöchentlich, Woche 1, Sonntag, 17:00-18:00
diff --git a/debian/changelog b/debian/changelog
index d86e7ca..a1894b9 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,3 +1,9 @@
+rhautoimport (62-1) unstable; urgency=medium
+
+ * add importer for crossing borders
+
+ -- Christian Pointner <equinox@helsinki.at> Wed, 17 Jun 2020 17:57:23 +0200
+
rhautoimport (61-1) unstable; urgency=medium
* onda-info: use title not filename
diff --git a/graveyard/INFO b/graveyard/INFO
index a85f901..ca882f0 100644
--- a/graveyard/INFO
+++ b/graveyard/INFO
@@ -34,3 +34,11 @@
Such-Kriterium: fortlaufende Nummer in Titel und Dateiname
RH: wöchentlich, Donnerstag 17:50-18:00 und Samstag 17:50-18:00
keine Wiederholung
+
+- (ab) A Year Abroad:
+ https://cba.fro.at/series/a-year-abroad/feed
+
+ Original: vierter Freitag im Monat
+ Upload: ein paar tage davor, gelegentlich erst ein paar Tage später...
+ Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
+ RH: 4wöchentlich, Woche 3, Freitag, 15:00-16:00
diff --git a/rhautoimport-ba b/rhautoimport-ba
index 0a53a09..6744ff8 100755
--- a/rhautoimport-ba
+++ b/rhautoimport-ba
@@ -50,7 +50,7 @@ binmode(STDERR, ":utf8");
my $curweek = RHRD::utils::get_rd_week();
-if($curweek == 3) {
+if($curweek == 2) {
if($#ARGV >= 0 && $ARGV[0] eq 'last') {
print "!!!This is the last attempt, there won't be a retry on error!!!\n";
$LAST_RUN = 1;
diff --git a/rhautoimport-cb b/rhautoimport-cb
new file mode 100755
index 0000000..8063ce4
--- /dev/null
+++ b/rhautoimport-cb
@@ -0,0 +1,208 @@
+#!/usr/bin/perl -w
+#
+#
+# rhautoimport
+#
+# Copyright (C) 2009-2017 Christian Pointner <equinox@helsinki.at>
+#
+# This file is part of rhautoimport.
+#
+# rhautoimport is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# any later version.
+#
+# rhautoimport is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with rhautoimport. If not, see <http://www.gnu.org/licenses/>.
+#
+
+use strict;
+use Date::Calc;
+use DateTime::Format::Strptime;
+use XML::Feed;
+use XML::Feed::Entry;
+use XML::Feed::Content;
+use XML::Feed::Enclosure;
+use URI::URL;
+use HTML::Entities;
+use RHRD::utils;
+
+use lib '/usr/local/share/rhautoimport/';
+use rhautoimport;
+
+# Per-show settings of the Crossing Borders importer.
+my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-cb.stat";   # holds id and file name of the last import
+my $RSS_URL = "https://cba.fro.at/series/crossing-borders/feed";
+my $RD_GROUP = "crossingb";
+my $PV_ID = '809';
+my $TITLE = "Crossing Borders";
+my $LAST_RUN = 0;
+my $upload_delay_days = 0;
+
+# Make XML::Feed hand out all enclosures of an entry instead of a single one.
+$XML::Feed::MULTIPLE_ENCLOSURES=1;
+
+# All standard streams carry UTF-8 text.
+binmode($_, ":utf8") for (\*STDIN, \*STDOUT, \*STDERR);
+
+my $curweek = RHRD::utils::get_rd_week();
+
+# A first argument of 'last' marks the final attempt, but it is only
+# honoured while we are in week 1.
+my $last_requested = (@ARGV > 0 && $ARGV[0] eq 'last');
+if($curweek == 1 && $last_requested) {
+  print "!!!This is the last attempt, there won't be a retry on error!!!\n";
+  $LAST_RUN = 1;
+}
+rhautoimport::report_title_and_last($TITLE, $LAST_RUN);
+
+
+# Work out the date of the next Radio Helsinki broadcast (@import_date).
+#
+# The show airs on the Sunday of week 1 of the four-week cycle, so we take
+# the Sunday of the current calendar week and move it forward by whole
+# weeks until it lands in week 1.
+# NOTE(review): this assumes RHRD::utils::get_rd_week() counts weeks with the
+# same Monday-to-Sunday boundaries as Date::Calc's business weeks - confirm.
+my @today = Date::Calc::Today();
+print "today: " . Date::Calc::Date_to_Text(@today) . " (Week: " . $curweek . ")\n";
+
+# Business dates are (year, week, day-of-week); day-of-week 7 is Sunday.
+my @import_date = Date::Calc::Standard_to_Business(@today);
+$import_date[2] = 7;
+@import_date = Date::Calc::Business_to_Standard(@import_date);
+
+if($curweek == 2) {
+  @import_date = Date::Calc::Add_Delta_Days(@import_date, 21);
+} elsif($curweek == 3) {
+  @import_date = Date::Calc::Add_Delta_Days(@import_date, 14);
+} elsif($curweek != 1) {
+  @import_date = Date::Calc::Add_Delta_Days(@import_date, 7);
+}
+# In week 1 the Sunday of the current week already is the broadcast day, so
+# no offset is added. Adding 7 days here would point at the Sunday of week 2
+# and yield a wrong id for the PV note and the stat file.
+print "day of next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n";
+
+
+# Resolve the dropbox of this group. A result whose first element is
+# undefined and whose second element is defined carries a message in the
+# second element; anything other than exactly one dropbox is an error.
+my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP);
+my ($dropbox, $lookup_message) = @allowed_dbs;
+if(defined $lookup_message && !defined $dropbox) {
+  print "$lookup_message\n";
+  exit 1;
+}
+
+unless(@allowed_dbs == 1) {
+  print "found more or less than one Dropbox for this group?!\n";
+  exit 1;
+}
+my $show_id = $dropbox->{'SHOWID'};
+my $show_title = $dropbox->{'SHOWTITLE'};
+
+# Find the latest original broadcast before the Radio Helsinki date: the
+# first Thursday (weekday 4, occurrence 1) of the import month, or the one
+# of the month before if that Thursday is not earlier than the import date.
+my ($rh_year, $rh_month) = @import_date[0, 1];
+my @broadcast_date = Date::Calc::Nth_Weekday_of_Month_Year($rh_year, $rh_month, 4, 1);
+unless(Date::Calc::Delta_Days(@broadcast_date, @import_date) > 0) {
+  my ($prev_year, $prev_month) = Date::Calc::Add_Delta_YM(@broadcast_date, 0, -1);
+  @broadcast_date = Date::Calc::Nth_Weekday_of_Month_Year($prev_year, $prev_month, 4, 1);
+}
+print "day of latest original broadcast before next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@broadcast_date) . "\n";
+
+# Nothing to fetch unless more than $upload_delay_days days have passed
+# since the original broadcast.
+my $days_since_broadcast = Date::Calc::Delta_Days(@broadcast_date, @today);
+if($days_since_broadcast <= $upload_delay_days) {
+  print "File won't be available by now!\n";
+  exit 42;
+}
+
+# ISO-style date strings: $id for the Radio Helsinki date, $bd for the original broadcast.
+my ($id, $bd) = map { sprintf("%04d-%02d-%02d", @{$_}) } (\@import_date, \@broadcast_date);
+
+print "looking for files with cba:broadcastDate $bd in RSS Feed (will be using cba:productionDate if cba:broadcastDate is not set)\n";
+print " -> $RSS_URL\n";
+
+# Fetch the series feed and pick the audio enclosure of the entry whose
+# cba:broadcastDate (or cba:productionDate as fallback) equals @broadcast_date.
+# On success $uri, $file, $sum_title and $sum_text are set; otherwise the
+# script exits (42: already imported, 1: error or nothing found).
+my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL);
+unless ($result) {
+  print "Error fetching feed: $feed\n";
+  exit 1;
+}
+
+my $uri = "";
+my $file = "";
+my $sum_title = "";
+my $sum_text = "";
+
+my $i = 0;
+for my $entry ($feed->entries) {
+  $i++;
+  next unless $entry->enclosure;
+
+  my $entry_bdt = $entry->{'entry'}{'https://cba.fro.at/help#feeds'}{'broadcastDate'};
+  my $format_string = "%a, %d %b %Y %H:%M:%S";
+  unless (defined $entry_bdt) {
+    $entry_bdt = $entry->{'entry'}{'https://cba.fro.at/help#feeds'}{'productionDate'};
+    $format_string = "%a, %d %b %Y";
+  }
+  next unless (defined $entry_bdt);
+
+  # A single malformed date must not abort the whole run: the parser may die
+  # or return undef on input that does not match the pattern, so such
+  # entries are skipped.
+  my $bdt = eval { DateTime::Format::Strptime::strptime($format_string, $entry_bdt) };
+  unless (defined $bdt) {
+    print "$i: skipping entry with unparsable date '$entry_bdt'\n";
+    next;
+  }
+
+  next unless($broadcast_date[0] == $bdt->year && $broadcast_date[1] == $bdt->month && $broadcast_date[2] == $bdt->day);
+
+  my $j = 0;
+  for my $enclosure($entry->enclosure) {
+    $j++;
+    my $type = $enclosure->type;
+    next unless defined $type;
+    if($type eq "audio/mpeg" || $type eq "audio/ogg") {
+      print "$i/$j: (" . $type . ", " . $enclosure->length . ") " . $enclosure->url . "\n";
+
+      # Strip a trailing "_cut" in front of the file extension from the URL.
+      my $orig_uri = $enclosure->url;
+      if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) {
+        $orig_uri = $1 . $2;
+      }
+
+      $uri = URI::URL->new($orig_uri);
+      my @path = $uri->path_components;
+      $file = $path[-1];
+
+      # The stat file stores "<id>\n<file>" of the last successful import.
+      # Read it directly instead of shelling out; a missing or empty file
+      # simply means that nothing has been imported yet.
+      my $current_stat = "";
+      if(open(my $fhr, '<', $STAT_FILE)) {
+        local $/;
+        my $content = <$fhr>;
+        $current_stat = $content if defined $content;
+        close($fhr);
+      }
+      my ($current_id, $current_file) = $current_stat =~ m/^(.*)\n(.*)/;
+      if(defined $current_id && defined $current_file && $current_id eq $id && $current_file eq $file) {
+        print "Already downloaded file of today\n";
+        exit 42;
+      }
+      if(!rhautoimport::check_file_extension($file)) {
+        print "\n\nThe extension of the matching file '". $file . "' seems to be wrong - manual import necessary!!!\n";
+        print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+        exit 1;
+      }
+
+      # Missing title or body becomes an empty string rather than undef.
+      my $raw_title = $entry->title;
+      my $raw_body = $entry->content->body;
+      $sum_title = defined $raw_title ? decode_entities($raw_title) : "";
+      $sum_text = defined $raw_body ? decode_entities($raw_body) : "";
+      print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";
+      last;
+    }
+  }
+  last if $uri ne "";
+}
+if($uri eq "") {
+  print "No Entry found from $bd - ";
+  if($LAST_RUN) {
+    print "giving up, manual import necessary!!!\n";
+    print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+  } else {
+    print "will retry later\n";
+  }
+  exit 1;
+}
+
+# Import the selected file, attach the summary as PV note and remember what
+# was imported. Exit codes: 1 if the import fails, 23 if only the note
+# could not be added, 0 otherwise.
+print "\n\nwill import '$uri' to show $show_id, $show_title\n\n";
+
+my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string);
+if($ret) {
+  print "\nImport Error:\n\n";
+  print $log;
+  print "\n\nNot adding PV note!!";
+  exit 1;
+}
+print "\nImport Success:\n\n";
+print $log;
+print "\n";
+my $exit_code = 0;
+($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1");
+print $log;
+if($ret) {
+  print "\nIgnoring failed note import - manual intervention necessary!\n";
+  $exit_code = 23;
+}
+
+# Record "<id>\n<file>" so that a later run recognises this import as done.
+# The import itself has already succeeded at this point, so a failure to
+# write the stat file is reported but does not change the exit code.
+unlink($STAT_FILE);
+my $stat_written = 0;
+if(open(my $fhs, '>', $STAT_FILE)) {
+  $stat_written = print {$fhs} "$id\n$file";
+  $stat_written = close($fhs) && $stat_written;
+}
+unless($stat_written) {
+  print "\nWarning: unable to write stat file '$STAT_FILE': $!\n";
+}
+
+exit $exit_code;