2020-07-28 11:01:44 +00:00
|
|
|
package Travelynx::Helper::HAFAS;
|
2021-01-05 21:27:46 +00:00
|
|
|
|
2020-11-27 21:12:56 +00:00
|
|
|
# Copyright (C) 2020 Daniel Friesel
|
|
|
|
#
|
2021-01-29 17:32:13 +00:00
|
|
|
# SPDX-License-Identifier: AGPL-3.0-or-later
|
2020-07-28 11:01:44 +00:00
|
|
|
|
|
|
|
use strict;
|
|
|
|
use warnings;
|
|
|
|
use 5.020;
|
|
|
|
|
|
|
|
use DateTime;
|
|
|
|
use Encode qw(decode);
|
|
|
|
use JSON;
|
|
|
|
use Mojo::Promise;
|
|
|
|
use XML::LibXML;
|
|
|
|
|
|
|
|
sub new {
|
|
|
|
my ( $class, %opt ) = @_;
|
|
|
|
|
|
|
|
my $version = $opt{version};
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
$opt{header}
|
|
|
|
= { 'User-Agent' =>
|
2020-09-06 10:41:36 +00:00
|
|
|
"travelynx/${version} on $opt{root_url} +https://finalrewind.org/projects/travelynx"
|
|
|
|
};
|
2020-07-28 11:01:44 +00:00
|
|
|
|
|
|
|
return bless( \%opt, $class );
|
|
|
|
}
|
|
|
|
|
|
|
|
sub get_polyline_p {
|
|
|
|
my ( $self, $train, $trip_id ) = @_;
|
|
|
|
|
2021-10-30 08:02:58 +00:00
|
|
|
my $line = $train->line // 0;
|
|
|
|
my $backend = $self->{hafas_rest_api};
|
|
|
|
my $url = "${backend}/trips/${trip_id}?lineName=${line}&polyline=true";
|
2020-07-28 11:01:44 +00:00
|
|
|
my $cache = $self->{main_cache};
|
|
|
|
my $promise = Mojo::Promise->new;
|
|
|
|
my $version = $self->{version};
|
|
|
|
|
|
|
|
if ( my $content = $cache->thaw($url) ) {
|
2020-09-10 19:20:26 +00:00
|
|
|
return $promise->resolve($content);
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
|
2021-10-30 08:02:58 +00:00
|
|
|
my $log_url = $url;
|
|
|
|
$log_url =~ s{://\K[^:]+:[^@]+\@}{***@};
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
$self->{user_agent}->request_timeout(5)->get_p( $url => $self->{header} )
|
|
|
|
->then(
|
2020-07-28 11:01:44 +00:00
|
|
|
sub {
|
|
|
|
my ($tx) = @_;
|
2020-07-28 12:19:55 +00:00
|
|
|
|
|
|
|
if ( my $err = $tx->error ) {
|
|
|
|
$promise->reject(
|
2021-10-30 08:02:58 +00:00
|
|
|
"hafas->get_polyline_p($log_url) returned HTTP $err->{code} $err->{message}"
|
2020-09-21 17:47:54 +00:00
|
|
|
);
|
2020-07-28 12:19:55 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2020-07-28 11:01:44 +00:00
|
|
|
my $body = decode( 'utf-8', $tx->res->body );
|
|
|
|
my $json = JSON->new->decode($body);
|
|
|
|
my @station_list;
|
|
|
|
my @coordinate_list;
|
|
|
|
|
|
|
|
for my $feature ( @{ $json->{polyline}{features} } ) {
|
|
|
|
if ( exists $feature->{geometry}{coordinates} ) {
|
|
|
|
my $coord = $feature->{geometry}{coordinates};
|
|
|
|
if ( exists $feature->{properties}{type}
|
|
|
|
and $feature->{properties}{type} eq 'stop' )
|
|
|
|
{
|
2020-07-28 12:19:55 +00:00
|
|
|
push( @{$coord}, $feature->{properties}{id} );
|
|
|
|
push( @station_list, $feature->{properties}{name} );
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
push( @coordinate_list, $coord );
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
my $ret = {
|
|
|
|
name => $json->{line}{name} // '?',
|
|
|
|
polyline => [@coordinate_list],
|
|
|
|
raw => $json,
|
|
|
|
};
|
|
|
|
|
|
|
|
$cache->freeze( $url, $ret );
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
# borders ("(Gr)" as in "Grenze") are only returned by HAFAS.
|
|
|
|
# They are not stations.
|
2020-07-28 11:01:44 +00:00
|
|
|
my $iris_stations = join( '|', $train->route );
|
|
|
|
my $hafas_stations
|
2020-07-28 12:19:55 +00:00
|
|
|
= join( '|', grep { $_ !~ m{\(Gr\)$} } @station_list );
|
2020-07-28 11:01:44 +00:00
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
# Do not return polyline if it belongs to an entirely different
|
|
|
|
# train. Trains with longer routes (e.g. due to train number
|
|
|
|
# changes, which are handled by HAFAS but left out in IRIS)
|
|
|
|
# are okay though.
|
2020-07-28 11:01:44 +00:00
|
|
|
if ( $iris_stations ne $hafas_stations
|
|
|
|
and index( $hafas_stations, $iris_stations ) == -1 )
|
|
|
|
{
|
2020-10-08 18:05:31 +00:00
|
|
|
$self->{log}->info( 'Ignoring polyline for '
|
2020-07-28 12:19:55 +00:00
|
|
|
. $train->line
|
|
|
|
. ": IRIS route does not agree with HAFAS route: $iris_stations != $hafas_stations"
|
2020-07-28 11:01:44 +00:00
|
|
|
);
|
2020-09-21 17:47:54 +00:00
|
|
|
$promise->reject(
|
2021-10-30 08:02:58 +00:00
|
|
|
"hafas->get_polyline_p($log_url): polyline route mismatch");
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
else {
|
|
|
|
$promise->resolve($ret);
|
|
|
|
}
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->catch(
|
|
|
|
sub {
|
|
|
|
my ($err) = @_;
|
2021-10-30 08:02:58 +00:00
|
|
|
$promise->reject("hafas->get_polyline_p($log_url): $err");
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->wait;
|
|
|
|
|
|
|
|
return $promise;
|
|
|
|
}
|
|
|
|
|
|
|
|
sub get_json_p {
|
|
|
|
my ( $self, $url ) = @_;
|
|
|
|
|
|
|
|
my $cache = $self->{main_cache};
|
|
|
|
my $promise = Mojo::Promise->new;
|
|
|
|
|
|
|
|
if ( my $content = $cache->thaw($url) ) {
|
2020-09-10 19:20:26 +00:00
|
|
|
return $promise->resolve($content);
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
$self->{user_agent}->request_timeout(5)->get_p( $url => $self->{header} )
|
|
|
|
->then(
|
2020-07-28 11:01:44 +00:00
|
|
|
sub {
|
|
|
|
my ($tx) = @_;
|
2020-07-28 12:19:55 +00:00
|
|
|
|
|
|
|
if ( my $err = $tx->error ) {
|
|
|
|
$promise->reject(
|
2020-09-21 17:47:54 +00:00
|
|
|
"hafas->get_json_p($url) returned HTTP $err->{code} $err->{message}"
|
|
|
|
);
|
2020-07-28 12:19:55 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2020-07-28 11:01:44 +00:00
|
|
|
my $body = decode( 'ISO-8859-15', $tx->res->body );
|
|
|
|
|
|
|
|
$body =~ s{^TSLs[.]sls = }{};
|
|
|
|
$body =~ s{;$}{};
|
|
|
|
$body =~ s{(}{(}g;
|
|
|
|
$body =~ s{)}{)}g;
|
|
|
|
my $json = JSON->new->decode($body);
|
|
|
|
$cache->freeze( $url, $json );
|
|
|
|
$promise->resolve($json);
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->catch(
|
|
|
|
sub {
|
|
|
|
my ($err) = @_;
|
2020-10-08 18:05:31 +00:00
|
|
|
$self->{log}->info("hafas->get_json_p($url): $err");
|
2020-09-21 17:47:54 +00:00
|
|
|
$promise->reject("hafas->get_json_p($url): $err");
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->wait;
|
|
|
|
return $promise;
|
|
|
|
}
|
|
|
|
|
|
|
|
sub get_xml_p {
|
|
|
|
my ( $self, $url ) = @_;
|
|
|
|
|
|
|
|
my $cache = $self->{realtime_cache};
|
|
|
|
my $promise = Mojo::Promise->new;
|
|
|
|
|
|
|
|
if ( my $content = $cache->thaw($url) ) {
|
2020-09-10 19:20:26 +00:00
|
|
|
return $promise->resolve($content);
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
$self->{user_agent}->request_timeout(5)->get_p( $url => $self->{header} )
|
|
|
|
->then(
|
2020-07-28 11:01:44 +00:00
|
|
|
sub {
|
|
|
|
my ($tx) = @_;
|
2020-07-28 12:19:55 +00:00
|
|
|
|
|
|
|
if ( my $err = $tx->error ) {
|
|
|
|
$promise->reject(
|
2020-09-21 17:47:54 +00:00
|
|
|
"hafas->get_xml_p($url) returned HTTP $err->{code} $err->{message}"
|
|
|
|
);
|
2020-07-28 12:19:55 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2020-07-28 11:01:44 +00:00
|
|
|
my $body = decode( 'ISO-8859-15', $tx->res->body );
|
|
|
|
my $tree;
|
|
|
|
|
|
|
|
my $traininfo = {
|
|
|
|
station => {},
|
|
|
|
messages => [],
|
|
|
|
};
|
|
|
|
|
2020-10-25 15:35:43 +00:00
|
|
|
# <SDay text="... > ..."> is invalid XML, but present in
|
2020-07-28 11:01:44 +00:00
|
|
|
# regardless. As it is the last tag, we just throw it away.
|
|
|
|
$body =~ s{<SDay [^>]*/>}{}s;
|
|
|
|
|
|
|
|
# More fixes for invalid XML
|
|
|
|
$body =~ s{P&R}{P&R};
|
2022-03-30 16:29:00 +00:00
|
|
|
$body =~ s{& }{& }g;
|
2020-10-25 15:35:43 +00:00
|
|
|
|
2021-06-05 12:17:49 +00:00
|
|
|
# <Attribute [...] text="[...]"[...]"" /> is invalid XML.
|
2020-10-25 15:35:43 +00:00
|
|
|
# Work around it.
|
|
|
|
$body
|
2021-06-05 12:17:49 +00:00
|
|
|
=~ s{<Attribute([^>]+)text="([^"]*)"([^"=>]*)""}{<Attribute$1text="$2*$3*"}s;
|
|
|
|
|
|
|
|
# Same for <HIMMessage lead="[...]"[...]"[...]" />
|
|
|
|
$body
|
|
|
|
=~ s{<HIMMessage([^>]+)lead="([^"]*)"([^"=>]*)"([^"]*)"}{<Attribute$1text="$2*$3*$4"}s;
|
2021-02-06 11:13:25 +00:00
|
|
|
|
2021-07-12 17:16:14 +00:00
|
|
|
# ... and <HIMMessage [...] lead="[...]<>[...]">
|
|
|
|
# (replace <> with t$t)
|
|
|
|
while ( $body
|
|
|
|
=~ s{<HIMMessage([^>]+)lead="([^"]*)<>([^"=]*)"}{<HIMMessage$1lead="$2⬌$3"}gis
|
|
|
|
)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
2021-02-06 11:13:25 +00:00
|
|
|
# Dito for <HIMMessage [...] lead="[...]<br>[...]">.
|
2021-02-06 17:06:09 +00:00
|
|
|
while ( $body
|
2021-04-24 07:11:18 +00:00
|
|
|
=~ s{<HIMMessage([^>]+)lead="([^"]*)<br/?>([^"=]*)"}{<HIMMessage$1lead="$2 $3"}is
|
|
|
|
)
|
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
# ... and any other HTML tag inside an XML attribute
|
|
|
|
while ( $body
|
|
|
|
=~ s{<HIMMessage([^>]+)lead="([^"]*)<[^>]+>([^"=]*)"}{<HIMMessage$1lead="$2$3"}is
|
2021-02-06 17:06:09 +00:00
|
|
|
)
|
|
|
|
{
|
|
|
|
}
|
2021-02-06 11:13:25 +00:00
|
|
|
|
2020-07-28 11:01:44 +00:00
|
|
|
eval { $tree = XML::LibXML->load_xml( string => $body ) };
|
2020-11-06 10:23:22 +00:00
|
|
|
if ( my $err = $@ ) {
|
|
|
|
if ( $err =~ m{extra content at the end}i ) {
|
|
|
|
|
|
|
|
# We requested XML, but received an HTML error page
|
|
|
|
# (which was returned with HTTP 200 OK).
|
|
|
|
$self->{log}->debug("load_xml($url): $err");
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
# There is invalid XML which we might be able to fix via
|
|
|
|
# regular expressions, so dump it into the production log.
|
|
|
|
$self->{log}->info("load_xml($url): $err");
|
|
|
|
}
|
2020-07-28 11:01:44 +00:00
|
|
|
$cache->freeze( $url, $traininfo );
|
2020-11-06 10:23:22 +00:00
|
|
|
$promise->reject("hafas->get_xml_p($url): $err");
|
2020-07-28 11:01:44 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
for my $station ( $tree->findnodes('/Journey/St') ) {
|
|
|
|
my $name = $station->getAttribute('name');
|
|
|
|
my $adelay = $station->getAttribute('adelay');
|
|
|
|
my $ddelay = $station->getAttribute('ddelay');
|
|
|
|
$traininfo->{station}{$name} = {
|
|
|
|
adelay => $adelay,
|
|
|
|
ddelay => $ddelay,
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2020-07-28 12:19:55 +00:00
|
|
|
for my $message ( $tree->findnodes('/Journey/HIMMessage') ) {
|
2020-07-28 11:01:44 +00:00
|
|
|
my $header = $message->getAttribute('header');
|
|
|
|
my $lead = $message->getAttribute('lead');
|
|
|
|
my $display = $message->getAttribute('display');
|
|
|
|
push(
|
|
|
|
@{ $traininfo->{messages} },
|
|
|
|
{
|
|
|
|
header => $header,
|
|
|
|
lead => $lead,
|
|
|
|
display => $display
|
|
|
|
}
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
|
|
|
$cache->freeze( $url, $traininfo );
|
|
|
|
$promise->resolve($traininfo);
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->catch(
|
|
|
|
sub {
|
|
|
|
my ($err) = @_;
|
2020-10-08 18:05:31 +00:00
|
|
|
$self->{log}->info("hafas->get_xml_p($url): $err");
|
2020-09-21 17:47:54 +00:00
|
|
|
$promise->reject("hafas->get_xml_p($url): $err");
|
2020-09-10 19:20:26 +00:00
|
|
|
return;
|
2020-07-28 11:01:44 +00:00
|
|
|
}
|
|
|
|
)->wait;
|
|
|
|
return $promise;
|
|
|
|
}
|
|
|
|
|
|
|
|
1;
|