From bd90af22c3ca8275de1c8cee6b64cdc9fc52a55c Mon Sep 17 00:00:00 2001 From: Christian Pointner Date: Fri, 28 Jul 2017 01:32:50 +0200 Subject: added importer for x_xy diff --git a/INFO b/INFO index 566e1bf..b83690e 100644 --- a/INFO +++ b/INFO @@ -29,3 +29,21 @@ sind laut O94 Homepage gelaufen... RH: 4wöchentlich, Woche 3, Dienstag, 16:00-16:30 4wöchtenlich, Woche 2, Mittwoch, 14:00-14:30, Wiederholung + +- Pura Vida Sounds: + https://cba.fro.at/series/pura-vida-sounds/feed + + Original: monatlich + Upload: am ersten des Monats oder letzten des Vormonats + Such-Kriterium: Dateiname beginnt mit 'YYYY-mm-dd' + es gibt nur eine Sendung pro Monat -> immer die + aktuellste spielen (manchmal 2 statt eine Wiederh.) + RH: 2wöchentlich, Woche 2/4, Montag, 16:00-17:00 + +- X_XY (Un)gelöst und (Un)erhört!: + https://cba.fro.at/series/x_xy-ungeloest-und-unerhoert/feed + + Original: 2wöchentlich, Woche 2/4, Freitag + Upload: oft ein paar Tage davor, manchmal erst 1 Tag später + Such-Kriterium: Dateiname beginnt mit 'dd-mm-YYYY' + RH: 2wöchentlich, Woche 2/4, Dienstag, 13:00-14:00 diff --git a/Makefile b/Makefile index 5040694..f6dfeea 100644 --- a/Makefile +++ b/Makefile @@ -26,7 +26,7 @@ endif .PHONY: clean distclean EXECUTABLE := rhautoimport -IMPORTER := btl dn dv ek er eu fb fl gd nw oi po pv rs ra tr wr +IMPORTER := btl dn dv ek er eu fb fl gd nw oi po pv rs ra tr wr xy EXECUTABLES := $(IMPORTER:%=$(EXECUTABLE)-%) all: $(EXECUTABLE) diff --git a/TODO b/TODO index 7050032..2309dd3 100644 --- a/TODO +++ b/TODO @@ -1,13 +1,3 @@ -- Pura Vida Sounds: - https://cba.fro.at/series/pura-vida-sounds/feed - - Original: monatlich - Upload: am ersten des Monats oder letzten des Vormonats - Such-Kriterium: Dateiname beginnt mit 'YYYY-mm-dd' - es gibt nur eine Sendung pro Monat -> immer die - aktuellste spielen (manchmal 2 statt eine Wiederh.) 
- RH: 2wöchentlich, Woche 2/4, Montag, 16:00-17:00 - - literadio on air: https://cba.fro.at/series/aufdraht-literadio-on-air/feed @@ -15,12 +5,3 @@ Upload: ? Such-Kriterium: Titel enthält manchmal mm-YY oder m-YYYY RH: 4wöchentlich, Woche 3, Montag, 16:30-17:00 - -- X_XY (Un)gelöst und (Un)erhört!: - https://cba.fro.at/series/x_xy-ungeloest-und-unerhoert/feed - - Original: 2wöchentlich, Woche 2/4, Freitag - Upload: oft ein paar Tage davor, manchmal erst 1 Tag später - Such-Kriterium: Dateiname bgeinnt mit 'dd-mm-YYYY' - wird sehr oft nicht richtig gemacht - RH: 2wöchentlich, Woche 2/4, Montag, 13:00-14:00 diff --git a/debian/changelog b/debian/changelog index 61a5d5c..c470c91 100644 --- a/debian/changelog +++ b/debian/changelog @@ -1,3 +1,9 @@ +rhautoimport (36-1) unstable; urgency=medium + + * added import for x_xy + + -- Christian Pointner Fri, 28 Jul 2017 01:31:35 +0200 + rhautoimport (35-1) unstable; urgency=medium * fix last attempt for pura-vida diff --git a/rhautoimport-xy b/rhautoimport-xy new file mode 100755 index 0000000..6027ed7 --- /dev/null +++ b/rhautoimport-xy @@ -0,0 +1,194 @@ +#!/usr/bin/perl -w +# +# +# rhautoimport +# +# Copyright (C) 2009-2017 Christian Pointner +# +# This file is part of rhautoimport. +# +# rhautoimport is free software: you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation, either version 3 of the License, or +# any later version. +# +# rhautoimport is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with rhautoimport. If not, see . 
+# + +use strict; +use Date::Calc; +use XML::Feed; +use XML::Feed::Entry; +use XML::Feed::Content; +use XML::Feed::Enclosure; +use URI::URL; +use HTML::Entities; + +use lib '/usr/local/share/rhautoimport/'; +use rhautoimport; + +my $STAT_FILE = $ENV{'HOME'} . "/rhautoimport-xy.stat"; +my $RSS_URL = "https://cba.fro.at/series/x_xy-ungeloest-und-unerhoert/feed"; +$XML::Feed::MULTIPLE_ENCLOSURES=1; +my $RD_GROUP = "X_XYungel"; +my $RD_CART = 111001; +my $PV_ID = '608'; +my $TITLE="X_XY (Un)gelöst und (Un)erhört!"; +my $LAST_RUN = 0; +my $upload_delay_days = 1; # files are usually there at least 1 day after original broadcast + +binmode(STDIN, ":utf8"); +binmode(STDOUT, ":utf8"); +binmode(STDERR, ":utf8"); + +my $curweek = RHRD::utils::get_rd_week(); + +if($#ARGV >= 0 && $ARGV[0] eq 'last') { + if($curweek == 2 || $curweek == 4) { + print "!!!This is the last attempt, there won't be a retry on error!!!\n"; + $LAST_RUN = 1; + } +} +rhautoimport::report_title_and_last($TITLE, $LAST_RUN); + + +my @allowed_dbs = rhautoimport::get_dropboxes($RD_GROUP); +if(!defined $allowed_dbs[0] && defined $allowed_dbs[1]) { + print "$allowed_dbs[1]\n"; + exit 1; +} + +if(scalar(@allowed_dbs) != 1) { + print "found more or less than one Dropbox for this group?!\n"; + exit 1; +} +my $show_id = $allowed_dbs[0]->{'SHOWID'}; +my $show_title = $allowed_dbs[0]->{'SHOWTITLE'}; + +my @today = Date::Calc::Today(); + +my @import_date = Date::Calc::Standard_to_Business(@today); +my $dow = $import_date[2]; +@import_date = Date::Calc::Business_to_Standard($import_date[0], $import_date[1], 2); +if($dow <= 2) { + if($curweek == 1 || $curweek == 3) { + @import_date = Date::Calc::Add_Delta_Days(@import_date, 7); + } +} else { + @import_date = Date::Calc::Add_Delta_Days(@import_date, 7); + if($curweek == 2 || $curweek == 4) { + @import_date = Date::Calc::Add_Delta_Days(@import_date, 7); + } +} + +my @broadcast_date = Date::Calc::Add_Delta_Days(@import_date, -11); +print "today: " . 
Date::Calc::Date_to_Text(@today) . "\n"; +print "day of next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n"; +print "day of latest original broadcast before next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@broadcast_date) . "\n"; + +if(Date::Calc::Delta_Days(@broadcast_date, @today) <= $upload_delay_days) { + print "File won't be available by now!\n"; + exit 42; +} + +my $id = sprintf("%04d-%02d-%02d", @import_date); +my $bd = sprintf("%04d-%02d-%02d", @broadcast_date); +my $bdfile = sprintf("^0?%d-?0?%d-?%04d", $broadcast_date[2], $broadcast_date[1], $broadcast_date[0]); +print "looking for files from $bd in RSS Feed\n"; +print " -> $RSS_URL\n"; + +my ($result, $feed) = rhautoimport::fetch_parse_rss_cba($RSS_URL); +unless ($result) { + print "Error fetching feed: $feed\n"; + exit 1; +} + +my $uri = ""; +my $file = ""; +my $sum_title = ""; +my $sum_text = ""; + +my $i = 0; +for my $entry ($feed->entries) { + $i++; + next unless $entry->enclosure; + my $j = 0; + for my $enclosure($entry->enclosure) { + $j++; + if($enclosure->type eq "audio/mpeg" || $enclosure->type eq "audio/ogg") { + print "$i/$j: (" . $enclosure->type . ", " . $enclosure->length . ") " . $enclosure->url . "\n"; + my $orig_uri = $enclosure->url; + if($orig_uri =~ /^(.*)_cut(\.[^\.]+)$/) { + $orig_uri = $1 . $2; + } + + $uri = new URI::URL($orig_uri); + my @path = $uri->path_components; + $file = $path[-1]; + unless(uc($file) =~ $bdfile) { # file not from correct day + $uri = ""; + next; + } + + my $current_file = `cat $STAT_FILE`; + if($current_file eq $file) { + print "Already downloaded file of today\n"; + exit 42; + } + if(!rhautoimport::check_file_extension($file)) { + print "\n\nThe extension of the matching file '". $file . 
"' seems to be wrong - manual import necessary!!!\n"; + print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; + exit 1; + } + + $sum_title = decode_entities($entry->title); + $sum_text = decode_entities($entry->content->body); + print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n"; + last; + } + } + last if $uri ne ""; +} +if($uri eq "") { + print "No Entry found from $bd - "; + if($LAST_RUN) { + print "giving up, manual import necessary!!!\n"; + print "\n\n --> https://import.helsinki.at/shows/$show_id\n"; + } else { + print "will retry later\n"; + } + exit 1; +} + +print "\n\nwill import '$uri' to show $show_id, $show_title\n\n"; + +my ($ret, $log) = rhautoimport::import_uri($show_id, $uri->as_string, undef, $RD_CART); +if($ret) { + print "\nImport Error:\n\n"; + print $log; + print "\n\nNot adding PV note!!"; + exit 1; +} +print "\nImport Success:\n\n"; +print $log; +print "\n"; +my $exit_code = 0; +($ret, $log) = rhautoimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1"); +print $log; +if($ret) { + print "\nIgnoring failed note import - manual intervention necessary!\n"; + $exit_code = 23; +} + +unlink($STAT_FILE); +open(my $fhs, '>', $STAT_FILE); +print $fhs "$file"; +close($fhs); + +exit $exit_code; diff --git a/rhautoimport.pm b/rhautoimport.pm index ed6a8cc..a366d9a 100644 --- a/rhautoimport.pm +++ b/rhautoimport.pm @@ -209,12 +209,17 @@ sub parse_result sub import_uri { - my ($show_id, $uri, $file_policy) = @_; + my ($show_id, $uri, $file_policy, $cart) = @_; my %request; $request{'LOGIN_NAME'} = RD_USER; $request{'SHOW_ID'} = int($show_id); - $request{'CLEAR_SHOW_CARTS'} = JSON->true; + if($cart) { + $request{'CART_NUMBER'} = $cart; + $request{'CLEAR_CART'} = JSON->true; + } else { + $request{'CLEAR_SHOW_CARTS'} = JSON->true; + } $request{'SOURCE_URI'} = $uri; $request{'SOURCE_FILE_POLICY'} = $file_policy if $file_policy; -- cgit v0.10.2