From 3650a2e89f32085a2f8af7157df352ed4d8ee583 Mon Sep 17 00:00:00 2001
From: Christian Pointner
Date: Wed, 26 Sep 2018 19:00:51 +0200
Subject: added importer for 'die toten europas' WIP

diff --git a/INFO b/INFO
index 1e37409..286a875 100644
--- a/INFO
+++ b/INFO
@@ -119,3 +119,12 @@
     Upload: ein paar tage davor, gelegentlich erst ein paar Tage später...
     Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate
     RH: 4wöchentlich, Woche 3, Freitag, 15:00-16:00
+
+- (dte) Die Toten Europas:
+    https://cba.fro.at/series/die-toten-europas/feed
+
+    Original: abgeschlossene Reihe bestehend aus 34 Episoden
+    Upload: bereits vollständig vorhanden
+    Such-Kriterium: fortlaufende Nummer in Titel und Dateiname
+    RH: wöchentlich, Dienstag 10:00-10:30 und Samstag 15:00-15:30
+        keine Wiederholung
diff --git a/rhautoimport-dte b/rhautoimport-dte
new file mode 100755
index 0000000..3673a69
--- /dev/null
+++ b/rhautoimport-dte
@@ -0,0 +1,249 @@
+#!/usr/bin/perl -w
+#
+#
+#  rhautoimport
+#
+#  Copyright (C) 2009-2018 Christian Pointner
+#
+#  This file is part of rhautoimport.
+#
+#  rhautoimport is free software: you can redistribute it and/or modify
+#  it under the terms of the GNU General Public License as published by
+#  the Free Software Foundation, either version 3 of the License, or
+#  any later version.
+#
+#  rhautoimport is distributed in the hope that it will be useful,
+#  but WITHOUT ANY WARRANTY; without even the implied warranty of
+#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+#  GNU General Public License for more details.
+#
+#  You should have received a copy of the GNU General Public License
+#  along with rhautoimport. If not, see http://www.gnu.org/licenses/.
+#
+
+# Importer for the series 'Die Toten Europas': looks up the episode with the
+# next consecutive number in the CBA feed and imports it into the dropbox of
+# the upcoming Tuesday or Saturday show.
+#
+# Exit codes: 0 on success, 1 on error, 23 if only the PV note failed and
+# 42 if the file for the upcoming show has already been imported.
+
+use strict;
+use Date::Calc;
+use XML::Feed;
+use XML::Feed::Entry;
+use XML::Feed::Content;
+use XML::Feed::Enclosure;
+use URI::URL;
+use HTML::Entities;
+## TODO: remove me!
+use lib '../rhrdlibs/lib/';
+use RHRD::utils;
+
+use lib '/usr/local/share/rhautoimport/';
+use rhautoimport;
+
+my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-dte.stat";
+my $LAST_FILE = $ENV{'HOME'} . "/rhautoimport-dte.last";
+my $RSS_URL = "https://cba.fro.at/series/die-toten-europas/feed";
+$XML::Feed::MULTIPLE_ENCLOSURES=1;
+my $RD_GROUP = "dietoteneu";
+my $RD_CART_TU = 118201;
+my $RD_CART_SA = 118204;
+my $PV_ID = '719';
+my $TITLE="Die Toten Europas";
+my $LAST_RUN = 0;
+
+# Returns the content of the state file $path, or an empty string if the
+# file does not exist or cannot be read.
+sub read_state_file {
+  my ($path) = @_;
+  open(my $fh, '<', $path) or return "";
+  local $/;
+  my $content = <$fh>;
+  close($fh);
+  return defined $content ? $content : "";
+}
+
+# Replaces the state file $path with $content. Returns 1 on success; on
+# failure the problem is reported and 0 is returned.
+sub write_state_file {
+  my ($path, $content) = @_;
+  unlink($path);
+  my $fh;
+  unless(open($fh, '>', $path)) {
+    print "\ncan't open '$path' for writing: $!\n";
+    return 0;
+  }
+  my $ok = print $fh $content;
+  $ok = close($fh) && $ok;
+  unless($ok) {
+    print "\ncan't write to '$path': $!\n";
+    return 0;
+  }
+  return 1;
+}
+
+binmode(STDIN, ":utf8");
+binmode(STDOUT, ":utf8");
+binmode(STDERR, ":utf8");
+
+rhautoimport::report_title_and_last($TITLE, $LAST_RUN);
+
+my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP);
+if(!defined $allowed_dbs[0] && defined $allowed_dbs[1]) {
+  print "$allowed_dbs[1]\n";
+  exit 1;
+}
+if(scalar(@allowed_dbs) != 2) {
+  print "found more or less than two Dropboxes for this group?!\n";
+  exit 1;
+}
+# the dropbox with SHOWDOW 2 is used for Tuesday, the other one for Saturday
+my $idx_tu = 0;
+my $idx_sa = 1;
+if($allowed_dbs[0]->{'SHOWDOW'} != 2) {
+  $idx_sa = 0;
+  $idx_tu = 1;
+}
+
+my $show_id = 0;
+my $show_title = "";
+my $rd_cart = 0;
+
+my @today = Date::Calc::Today();
+my $dow = Date::Calc::Day_of_Week(@today);
+my @import_date = Date::Calc::Standard_to_Business(@today);
+
+# Day_of_Week is 1 (Monday) to 7 (Sunday): Sunday and Monday prepare the
+# Tuesday show, all other days prepare the Saturday show
+if($dow < 2 || $dow > 6) {
+  $show_id = $allowed_dbs[$idx_tu]->{'SHOWID'};
+  $show_title = $allowed_dbs[$idx_tu]->{'SHOWTITLE'};
+  $rd_cart=$RD_CART_TU;
+  $import_date[2] = 2;
+} else {
+  $show_id = $allowed_dbs[$idx_sa]->{'SHOWID'};
+  $show_title = $allowed_dbs[$idx_sa]->{'SHOWTITLE'};
+  $rd_cart=$RD_CART_SA;
+  $import_date[2] = 6;
+}
+
+@import_date = Date::Calc::Business_to_Standard(@import_date);
+# on a Sunday the Tuesday of the current week is already over
+if($dow > 6) {
+  @import_date = Date::Calc::Add_Delta_Days(@import_date, 7);
+}
+
+# the number of the last imported episode is kept in $LAST_FILE, a missing
+# or empty file means that nothing has been imported yet
+my $last_raw = read_state_file($LAST_FILE);
+my $broadcast_num = 0;
+if($last_raw =~ /^\s*(\d+)\s*$/) {
+  $broadcast_num = $1;
+} elsif($last_raw =~ /\S/) {
+  print "invalid content in '$LAST_FILE' - manual intervention necessary!!!\n";
+  exit 1;
+}
+$broadcast_num += 1;
+my $bdfileexp = sprintf("^%02d-", $broadcast_num);
+
+print "today: " . Date::Calc::Date_to_Text(@today) . "\n";
+print "day of next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n";
+print "Number of next broadcast: " . $broadcast_num . "\n\n";
+
+my $id = sprintf("%04d-%02d-%02d", @import_date);
+
+# the first line of $STAT_FILE holds the date of the last imported show
+my ($current_id) = read_state_file($STAT_FILE) =~ m/^(.*)\n/;
+if(defined $current_id && $current_id eq $id) {
+  print "Already downloaded current file\n";
+  exit 42;
+}
+
+print "looking for file #$broadcast_num using $bdfileexp in RSS Feed\n";
+print " -> $RSS_URL\n";
+
+my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL);
+unless ($result) {
+  print "Error fetching feed: $feed\n";
+  exit 1;
+}
+
+my $uri = "";
+my $file = "";
+my $sum_title = "";
+my $sum_text = "";
+
+ENTRY: for my $entry ($feed->entries) {
+  next unless $entry->enclosure;
+  for my $enclosure ($entry->enclosure) {
+    next unless($enclosure->type eq "audio/mpeg" || $enclosure->type eq "audio/ogg");
+
+    my $orig_uri = $enclosure->url;
+    if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) {
+      $orig_uri = $1 . $2;
+    }
+
+    my $candidate = URI::URL->new($orig_uri);
+    my @path = $candidate->path_components;
+    my $name = $path[-1];
+    next unless(defined $name && $name =~ /$bdfileexp/);
+
+    # only the file we are actually going to import has to pass this check,
+    # other episodes in the feed must not abort the import
+    if(!rhautoimport::check_file_extension($name)) {
+      print "\n\nThe extension of the matching file '". $name . "' seems to be wrong - manual import necessary!!!\n";
+      print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+      exit 1;
+    }
+
+    $uri = $candidate;
+    $file = $name;
+    $sum_title = decode_entities($entry->title);
+    $sum_text = decode_entities($entry->content->body);
+    last ENTRY;
+  }
+}
+if($uri eq "") {
+  print "No Entry for #$broadcast_num (there are no more shows available) - ";
+  if($LAST_RUN) {
+    print "giving up, manual import necessary!!!\n";
+    print "\n\n --> https://import.helsinki.at/shows/$show_id\n";
+  } else {
+    print "will retry later\n";
+  }
+  exit 1;
+}
+
+my $exit_code = 0;
+print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";
+print "\n\nwill import '$uri' to show $show_id, $show_title at cart $rd_cart\n\n";
+
+my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string, undef, $rd_cart);
+if($ret) {
+  print "\nImport Error:\n\n";
+  print $log;
+  print "\n\nNot adding PV note!!";
+  exit 1;
+}
+print "\nImport Success:\n\n";
+print $log;
+print "\n";
+($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1");
+print $log;
+if($ret) {
+  print "\nIgnoring failed note import - manual intervention necessary!\n";
+  $exit_code = 23;
+}
+
+# remember what has been imported, a failure here may lead to a repeated
+# import of the same episode on the next run
+unless(write_state_file($STAT_FILE, "$id\n$file")) {
+  $exit_code = 1;
+}
+unless(write_state_file($LAST_FILE, "$broadcast_num")) {
+  $exit_code = 1;
+}
+
+exit $exit_code;
-- 
cgit v0.10.2