#!/usr/bin/perl -w
#
#
#  rhimport
#
#  Copyright (C) 2009-2015 Christian Pointner
#
#  This file is part of rhimport.
#
#  rhimport is free software: you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation, either version 3 of the License, or
#  any later version.
#
#  rhimport is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with rhimport. If not, see <http://www.gnu.org/licenses/>.
#

# Purpose: locate the enclosure of the latest original broadcast in an RSS
# feed, download it to /tmp, attach the feed entry's title/body as a note via
# rhimport::pv_add_note and import the file into the single dropbox that
# belongs to group "svetjevas". A stat file in $HOME remembers the last
# successful import so repeated invocations do not import the same file twice.
#
# Usage: the optional first argument 'last' only changes the wording of the
# messages (it announces that no further retry will follow).
#
# Exit status: 0 on success or when there is nothing to do yet, 1 on error.

use strict;
use Date::Calc;
use XML::Feed;
use XML::Feed::Entry;
use XML::Feed::Content;
use XML::Feed::Enclosure;
use File::Fetch;
use IO::Handle;
use IPC::Open3;
use HTML::Entities;
use LWP::Simple;
use RHRD::rddb;

use lib '/usr/local/share/rhimport/';
use rhimport;

my $STAT_FILE = $ENV{'HOME'} . "/rhimport-sv.stat";
my $RSS_URL = "http://cba.fro.at/seriesrss/262457?c=Kfs2IoV2Wmd";
# Make $entry->enclosure return every enclosure of an entry in list context.
$XML::Feed::MULTIPLE_ENCLOSURES=1;
my $PV_ID = '396';

binmode(STDIN, ":utf8");
binmode(STDOUT, ":utf8");
binmode(STDERR, ":utf8");

# Read the import id and file name remembered from the last successful run.
# Returns a two element list; both elements are empty strings when the stat
# file is missing, unreadable or not in the expected "id\nfile" layout.
sub read_stat_file {
    my ($path) = @_;

    open(my $fh, '<', $path) or return ('', '');
    my $content = do { local $/; <$fh> };
    close($fh);
    return ('', '') unless defined $content;

    my ($last_id, $last_file) = $content =~ m/^(.*)\n(.*)/;
    return ('', '') unless defined $last_id;
    return ($last_id, $last_file);
}

my $is_last_attempt = ($#ARGV >= 0 && $ARGV[0] eq 'last');
if($is_last_attempt) {
    print "!!!This is the last attempt, there won't be a retry on error!!!\n"
}

my $user = `/usr/bin/id -un`;
chomp $user;
my $group = "svetjevas";

my ($dbh, $errorstring) = RHRD::rddb::opendb();
if(!defined $dbh) {
    print "$errorstring\n";
    exit 1;
}

my @allowed_dbs = RHRD::rddb::get_dropboxes($dbh, $user, $group);
# NOTE(review): an undefined first element with a defined third element is
# treated as "error, message in element 2" -- confirm against RHRD::rddb.
if(!defined $allowed_dbs[0] && defined $allowed_dbs[2]) {
    print "$allowed_dbs[2]\n";
    RHRD::rddb::closedb($dbh);
    exit 1;
}
if(scalar(@allowed_dbs) != 1) {
    print "found more or less than one Dropbox for this group?!\n";
    RHRD::rddb::closedb($dbh);
    exit 1;
}
my $dropbox = $allowed_dbs[0]->{'PATH'};
my $to_cart = $allowed_dbs[0]->{'TO_CART'};

my $curweek = rhimport::get_rd_week();
my @today = Date::Calc::Today();
my $dow = Date::Calc::Day_of_Week(@today);   # 1 = Monday ... 7 = Sunday

# Only act during week 3, or during week 4 up to and including Tuesday.
if(($curweek != 3 && $curweek != 4) || ($curweek == 4 && $dow > 2)) {
    print "File won't be available by now!\n";
    RHRD::rddb::closedb($dbh);
    exit 0;
}

print "today: " . Date::Calc::Date_to_Text(@today) . "\n";

# The import date is the Tuesday of the current calendar week, moved one week
# ahead when we are still in week 3.
my @import_date = Date::Calc::Standard_to_Business(@today);
$import_date[2] = 2;
@import_date = Date::Calc::Business_to_Standard(@import_date);
if($curweek == 3) {
    @import_date = Date::Calc::Add_Delta_Days(@import_date, 7);
}
print "day of next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@import_date) . "\n";

# The original broadcast is the first Sunday of the import date's month; if
# that Sunday is not strictly before the import date, use the first Sunday of
# the previous month instead.
my @broadcast_date = Date::Calc::Nth_Weekday_of_Month_Year($import_date[0], $import_date[1], 7, 1);
if(Date::Calc::Delta_Days(@broadcast_date, @import_date) <= 0) {
    my @tmp_date = Date::Calc::Add_Delta_YM(@broadcast_date, 0, -1);
    @broadcast_date = Date::Calc::Nth_Weekday_of_Month_Year($tmp_date[0], $tmp_date[1], 7, 1);
}
print "day of latest original broadcast before next Radio Helsinki broadcast: " . Date::Calc::Date_to_Text(@broadcast_date) . "\n";

# Nothing to fetch as long as the original broadcast is today or in the future.
if(Date::Calc::Delta_Days(@broadcast_date, @today) <= 0) {
    print "File won't be available by now!\n";
    RHRD::rddb::closedb($dbh);
    exit 0;
}

my $id = sprintf("%04d-%02d-%02d", @import_date);
my $bd = sprintf("%04d-%02d-%02d", @broadcast_date);
# File names of the wanted broadcast contain "SEOI" followed by day and month.
my $bdfile = sprintf("SEOI%02d%02d", $broadcast_date[2], $broadcast_date[1]);

print "looking for files from $bd in RSS Feed\n";
print " -> $RSS_URL\n";

my $feed = XML::Feed->parse(URI->new($RSS_URL));
if(!$feed) {
    RHRD::rddb::closedb($dbh);
    die "Error fetching feed: " . XML::Feed->errstr;
}

my $file = "";
my $out_file = "";
my $i = 0;
ENTRY:
for my $entry ($feed->entries) {
    $i++;
    next ENTRY unless $entry->enclosure;

    my $j = 0;
    ENCLOSURE:
    for my $enclosure ($entry->enclosure) {
        $j++;
        my $type = $enclosure->type;
        next ENCLOSURE unless ($type eq "audio/mpeg" || $type eq "audio/ogg");

        print "$i/$j: (" . $enclosure->type . ", " . $enclosure->length . ") " . $enclosure->url . "\n";

        # Drop a "_cut" suffix in front of the extension -- presumably this
        # addresses the uncut original; verify against the feed provider.
        my $url = $enclosure->url;
        if($url =~ /^(.*)_cut(\.[^\.]+)$/) {
            $url = $1 . $2;
        }

        my $ff = File::Fetch->new(uri => $url);
        # file not from correct day
        next ENCLOSURE if index(uc($ff->output_file), $bdfile) < 0;

        my $sum_title = decode_entities($entry->title);
        my $sum_text = decode_entities($entry->content->body);

        my ($current_id, $current_file) = read_stat_file($STAT_FILE);
        if($current_id eq $id && $current_file eq $ff->output_file) {
            print "Already downloaded file of today\n";
            RHRD::rddb::closedb($dbh);
            exit 0;
        }

        $out_file = $ff->output_file;
        if(!rhimport::check_file_extension($out_file)) {
            print "\n\nThe extension of the matching file '". $out_file . "' seems to be wrong - manual import necessary!!!\n";
            RHRD::rddb::closedb($dbh);
            exit 1;
        }

        print " --> " . $bdfile . ": downloading " . $url . " (" . $enclosure->length . " Bytes) .. ";
        $file = $ff->fetch( to => '/tmp' );
        if(!$file) {
            RHRD::rddb::closedb($dbh);
            die $ff->error;
        }
        print "ok\n";

        print "summary:\n" . $sum_title . "\n\n" . $sum_text . "\n";
        rhimport::pv_add_note($sum_title, $sum_text, $PV_ID, $id, "1");
        print "\n";

        # The first matching enclosure wins; stop scanning the feed.
        last ENTRY;
    }
}

if($file eq "" || !(-e "$file")) {
    print "No Entry found from $bd or download error - ";
    if($is_last_attempt) {
        print "giving up, manual import necessary!!!\n";
    } else {
        print "will retry later\n";
    }
    RHRD::rddb::closedb($dbh);
    exit 1;
}

print "will import $file to dropbox $dropbox (cart=$to_cart)\n";

# Error callback handed to rhimport::import_single: prints the message and
# returns 0.
my $error_cb = sub {
    my ($text) = @_;

    print "\n$text";
    return 0;
};

if(!rhimport::check_key_file()) {
    RHRD::rddb::closedb($dbh);
    die "Import Key not found, use rhimport-create-id to create one\n";
}

my $ret;
my $log = rhimport::clear_carts($dbh, $group, $to_cart);
my $import_log;
($ret, $import_log) = rhimport::import_single($file, $dropbox, $user, 0, $error_cb);
$log .= $import_log;
RHRD::rddb::closedb($dbh);

# The downloaded temporary file is removed whether or not the import worked.
unlink $file;

if(!$ret) {
    print "\nImport Error:\n";
    print $log;
    exit 1;
}

# Remember what has been imported so later runs can skip it. A failure here
# must not pass silently, otherwise the next run would import the file again.
unlink($STAT_FILE);
my $stat_written = 0;
if(open(my $fhs, '>', $STAT_FILE)) {
    my $printed = print $fhs "$id\n$out_file";
    my $closed = close($fhs);
    $stat_written = ($printed && $closed) ? 1 : 0;
}
if(!$stat_written) {
    print "Import succeeded but writing stat file '$STAT_FILE' failed: $!\n";
    exit 1;
}

exit 0;