From b2ce2c9f9bcddff855059b2883ddaf7e8ad01a5b Mon Sep 17 00:00:00 2001 From: Christian Pointner Date: Fri, 29 Apr 2022 13:55:38 +0200 Subject: move importer for Tierrechtsradio to graveyard diff --git a/INFO b/INFO index 477bb5b..a767275 100644 --- a/INFO +++ b/INFO @@ -58,14 +58,6 @@ Such-Kriterium: cba:broadcastDate wenn gesetzt sonst cba:productionDate RH: wöchentlich, Samstag, 15:30-16:00 -- (tr) Tierrechtsradio: - https://cba.fro.at/series/tierrechtsradio/feed - - Original: wöchentlich Freitags - Upload: meistens am selben Tag, nachmittags - Such-Kriterium: cba:broadcastDate - RH: wöchentlich, Freitag, 08:00-09:00 - - (ek) Eigenklang: https://cba.fro.at/series/eigenklang/feed diff --git a/Makefile b/Makefile index 6d62907..6f5065a 100644 --- a/Makefile +++ b/Makefile @@ -26,7 +26,7 @@ endif .PHONY: clean distclean EXECUTABLE := rhautoimport -IMPORTER := ar ba bo btl cb cr dm dn ek eu gd lr mz oi po rs ra tr so +IMPORTER := ar ba bo btl cb cr dm dn ek eu gd lr mz oi po rs ra so EXECUTABLES := $(IMPORTER:%=$(EXECUTABLE)-%) all: $(EXECUTABLE) diff --git a/graveyard/INFO b/graveyard/INFO index 8a72f70..3bca0af 100644 --- a/graveyard/INFO +++ b/graveyard/INFO @@ -71,3 +71,11 @@ sind laut O94 Homepage gelaufen... RH: 4wöchentlich, Woche 3, Dienstag, 16:00-16:30 4wöchentlich, Woche 2, Mittwoch, 14:00-14:30, Wiederholung + +- (tr) Tierrechtsradio: + https://cba.fro.at/series/tierrechtsradio/feed + + Original: wöchentlich Freitags + Upload: meistens am selben Tag, nachmittags + Such-Kriterium: cba:broadcastDate + RH: wöchentlich, Freitag, 08:00-09:00 diff --git a/graveyard/rhautoimport-tr b/graveyard/rhautoimport-tr new file mode 100755 index 0000000..541d2d7 --- /dev/null +++ b/graveyard/rhautoimport-tr @@ -0,0 +1,184 @@ +#!/usr/bin/perl -w +# +# +# rhautoimport +# +# Copyright (C) 2009-2017 Christian Pointner +# +# This file is part of rhautoimport. +# +# rhautoimport is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# any later version. +# +# rhautoimport is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with rhautoimport. If not, see . +# + +use strict; +use Date::Calc; +use DateTime::Format::Strptime; +use XML::Feed; +use XML::Feed::Entry; +use XML::Feed::Content; +use XML::Feed::Enclosure; +use URI::URL; +use HTML::Entities; + +use lib '/usr/local/share/rhautoimport/'; +use rhautoimport; + +my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-tr.stat"; +my $RSS_URL = "https://cba.fro.at/series/tierrechtsradio/feed"; +$XML::Feed::MULTIPLE_ENCLOSURES=1; +my $RD_GROUP = "tierrecht"; +my $PV_ID = '506'; +my $TITLE="Tierrechtsradio"; +my $LAST_RUN = 0; +my $upload_delay_days = 0; # files are usally there on the same day of the original broadcast + +binmode(STDIN, ":utf8"); +binmode(STDOUT, ":utf8"); +binmode(STDERR, ":utf8"); + +if($#ARGV >= 0 && $ARGV[0] eq 'last') { + print "!!!This is the last attempt, there won't be a retry on error!!!\n"; + $LAST_RUN = 1; +} +rhautoimport::report_title_and_last($TITLE, $LAST_RUN); + + +my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP); +if(!defined $allowed_dbs[0] && defined $allowed_dbs[1]) { + print "$allowed_dbs[1]\n"; + exit 1; +} + +if(scalar(@allowed_dbs) != 1) { + print "found more or less than one Dropbox for this group?!\n"; + exit 1; +} +my $show_id = $allowed_dbs[0]->{'SHOWID'}; +my $show_title = $allowed_dbs[0]->{'SHOWTITLE'}; + + +my @today = Date::Calc::Today(); +my @tmp = Date::Calc::Standard_to_Business(@today); +my @broadcast_date = Date::Calc::Business_to_Standard($tmp[0], $tmp[1], 5); +if($tmp[2] < 5) { + @broadcast_date = Date::Calc::Add_Delta_Days(@broadcast_date, -7); +} +my @import_date = Date::Calc::Add_Delta_Days(@broadcast_date, 7); +print "day of original broadcast: " . Date::Calc::Date_to_Text(@broadcast_date) . "\n"; +print "day of Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n"; + +if(Date::Calc::Delta_Days(@broadcast_date, @today) <= $upload_delay_days) { + print "File won't be available by now!\n"; + exit 42; +} + +my $id = sprintf("%04d-%02d-%02d", @import_date); +my $bd = sprintf("%04d-%02d-%02d", @broadcast_date); + +print "looking for files with cba:broadcastDate $bd in RSS Feed\n"; +print " -> $RSS_URL\n"; + +my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL); +unless ($result) { + print "Error fetching feed: $feed\n"; + exit 1; +} + +my $uri = ""; +my $file = ""; +my $sum_title = ""; +my $sum_text = ""; + +my $i = 0; +for my $entry ($feed->entries) { + $i++; + next unless $entry->enclosure; + + my $entry_bdt = $entry->{'entry'}{'https://cba.fro.at/help#feeds'}{'broadcastDate'}; + next unless (defined $entry_bdt); + my $bdt = DateTime::Format::Strptime::strptime("%a, %d %b %Y %H:%M:%S", $entry_bdt); + + next unless($broadcast_date[0] == $bdt->year && $broadcast_date[1] == $bdt->month && $broadcast_date[2] == $bdt->day); + + my $j = 0; + for my $enclosure($entry->enclosure) { + $j++; + if($enclosure->type eq "audio/mpeg" || $enclosure->type eq "audio/ogg") { + print "$i/$j: (" . $enclosure->type . ", " . $enclosure->length . ") " . $enclosure->url . "\n"; + my $orig_uri = $enclosure->url; + if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) { + $orig_uri = $1 . $2; + } + + $uri = new URI::URL($orig_uri); + my @path = $uri->path_components; + $file = $path[-1]; + + my $current_stat = `cat $STAT_FILE`; + my ($current_id, $current_file) = $current_stat =~ m/^(.*)\n(.*)/; + if($current_id eq $id && $current_file eq $file) { + print "Already downloaded file of today\n"; + exit 42; + } + if(!rhautoimport::check_file_extension($file)) { + print "\n\nThe extension of the matching file '". $file . "' seems to be wrong - manual import necessary!!!\n"; + print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; + exit 1; + } + + $sum_title = decode_entities($entry->title); + $sum_text = decode_entities($entry->content->body); + print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n"; + last; + } + } + last if $uri ne ""; +} +if($uri eq "") { + print "No Entry found from $bd - "; + if($LAST_RUN) { + print "giving up, manual import necessary!!!\n"; + print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; + } else { + print "will retry later\n"; + } + exit 1; +} + +print "\n\nwill import '$uri' to show $show_id, $show_title\n\n"; + +my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string); +if($ret) { + print "\nImport Error:\n\n"; + print $log; + print "\n\nNot adding PV note!!"; + exit 1; +} +print "\nImport Success:\n\n"; +print $log; +print "\n"; +my $exit_code = 0; +($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1"); +print $log; +if($ret) { + print "\nIgnoring failed note import - manual intervention necessary!\n"; + $exit_code = 23; +} + +unlink($STAT_FILE); +open(my $fhs, '>', $STAT_FILE); +print $fhs "$id\n$file"; +close($fhs); + +exit $exit_code; diff --git a/rhautoimport-tr b/rhautoimport-tr deleted file mode 100755 index 541d2d7..0000000 --- a/rhautoimport-tr +++ /dev/null @@ -1,184 +0,0 @@ -#!/usr/bin/perl -w -# -# -# rhautoimport -# -# Copyright (C) 2009-2017 Christian Pointner -# -# This file is part of rhautoimport. -# -# rhautoimport is free software: you can redistribute it and/or modify -# it under the terms of the GNU General Public License as published by -# the Free Software Foundation, either version 3 of the License, or -# any later version. -# -# rhautoimport is distributed in the hope that it will be useful, -# but WITHOUT ANY WARRANTY; without even the implied warranty of -# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -# GNU General Public License for more details. -# -# You should have received a copy of the GNU General Public License -# along with rhautoimport. If not, see . -# - -use strict; -use Date::Calc; -use DateTime::Format::Strptime; -use XML::Feed; -use XML::Feed::Entry; -use XML::Feed::Content; -use XML::Feed::Enclosure; -use URI::URL; -use HTML::Entities; - -use lib '/usr/local/share/rhautoimport/'; -use rhautoimport; - -my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-tr.stat"; -my $RSS_URL = "https://cba.fro.at/series/tierrechtsradio/feed"; -$XML::Feed::MULTIPLE_ENCLOSURES=1; -my $RD_GROUP = "tierrecht"; -my $PV_ID = '506'; -my $TITLE="Tierrechtsradio"; -my $LAST_RUN = 0; -my $upload_delay_days = 0; # files are usally there on the same day of the original broadcast - -binmode(STDIN, ":utf8"); -binmode(STDOUT, ":utf8"); -binmode(STDERR, ":utf8"); - -if($#ARGV >= 0 && $ARGV[0] eq 'last') { - print "!!!This is the last attempt, there won't be a retry on error!!!\n"; - $LAST_RUN = 1; -} -rhautoimport::report_title_and_last($TITLE, $LAST_RUN); - - -my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP); -if(!defined $allowed_dbs[0] && defined $allowed_dbs[1]) { - print "$allowed_dbs[1]\n"; - exit 1; -} - -if(scalar(@allowed_dbs) != 1) { - print "found more or less than one Dropbox for this group?!\n"; - exit 1; -} -my $show_id = $allowed_dbs[0]->{'SHOWID'}; -my $show_title = $allowed_dbs[0]->{'SHOWTITLE'}; - - -my @today = Date::Calc::Today(); -my @tmp = Date::Calc::Standard_to_Business(@today); -my @broadcast_date = Date::Calc::Business_to_Standard($tmp[0], $tmp[1], 5); -if($tmp[2] < 5) { - @broadcast_date = Date::Calc::Add_Delta_Days(@broadcast_date, -7); -} -my @import_date = Date::Calc::Add_Delta_Days(@broadcast_date, 7); -print "day of original broadcast: " . Date::Calc::Date_to_Text(@broadcast_date) . "\n"; -print "day of Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n"; - -if(Date::Calc::Delta_Days(@broadcast_date, @today) <= $upload_delay_days) { - print "File won't be available by now!\n"; - exit 42; -} - -my $id = sprintf("%04d-%02d-%02d", @import_date); -my $bd = sprintf("%04d-%02d-%02d", @broadcast_date); - -print "looking for files with cba:broadcastDate $bd in RSS Feed\n"; -print " -> $RSS_URL\n"; - -my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL); -unless ($result) { - print "Error fetching feed: $feed\n"; - exit 1; -} - -my $uri = ""; -my $file = ""; -my $sum_title = ""; -my $sum_text = ""; - -my $i = 0; -for my $entry ($feed->entries) { - $i++; - next unless $entry->enclosure; - - my $entry_bdt = $entry->{'entry'}{'https://cba.fro.at/help#feeds'}{'broadcastDate'}; - next unless (defined $entry_bdt); - my $bdt = DateTime::Format::Strptime::strptime("%a, %d %b %Y %H:%M:%S", $entry_bdt); - - next unless($broadcast_date[0] == $bdt->year && $broadcast_date[1] == $bdt->month && $broadcast_date[2] == $bdt->day); - - my $j = 0; - for my $enclosure($entry->enclosure) { - $j++; - if($enclosure->type eq "audio/mpeg" || $enclosure->type eq "audio/ogg") { - print "$i/$j: (" . $enclosure->type . ", " . $enclosure->length . ") " . $enclosure->url . "\n"; - my $orig_uri = $enclosure->url; - if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) { - $orig_uri = $1 . $2; - } - - $uri = new URI::URL($orig_uri); - my @path = $uri->path_components; - $file = $path[-1]; - - my $current_stat = `cat $STAT_FILE`; - my ($current_id, $current_file) = $current_stat =~ m/^(.*)\n(.*)/; - if($current_id eq $id && $current_file eq $file) { - print "Already downloaded file of today\n"; - exit 42; - } - if(!rhautoimport::check_file_extension($file)) { - print "\n\nThe extension of the matching file '". $file . "' seems to be wrong - manual import necessary!!!\n"; - print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; - exit 1; - } - - $sum_title = decode_entities($entry->title); - $sum_text = decode_entities($entry->content->body); - print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n"; - last; - } - } - last if $uri ne ""; -} -if($uri eq "") { - print "No Entry found from $bd - "; - if($LAST_RUN) { - print "giving up, manual import necessary!!!\n"; - print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; - } else { - print "will retry later\n"; - } - exit 1; -} - -print "\n\nwill import '$uri' to show $show_id, $show_title\n\n"; - -my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string); -if($ret) { - print "\nImport Error:\n\n"; - print $log; - print "\n\nNot adding PV note!!"; - exit 1; -} -print "\nImport Success:\n\n"; -print $log; -print "\n"; -my $exit_code = 0; -($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1"); -print $log; -if($ret) { - print "\nIgnoring failed note import - manual intervention necessary!\n"; - $exit_code = 23; -} - -unlink($STAT_FILE); -open(my $fhs, '>', $STAT_FILE); -print $fhs "$id\n$file"; -close($fhs); - -exit $exit_code; -- cgit v0.10.2