From 81806b59e1ebe7ea1f69a6ba0a192e483df0b594 Mon Sep 17 00:00:00 2001
From: Daniel Friesel
Date: Fri, 20 Dec 2013 10:28:46 +0100
Subject: Initial commit

---
Review notes (text between the "---" line above and the first "diff --git"
line is ignored when the patch is applied):

 * scripts/acronyms.pl reads lines from standard input. A line matches when
   it consists of two uppercase letters, up to three further uppercase
   letters or spaces, one whitespace character and a non-empty name. Each
   match is printed as a ['acronym','name'] entry (single quotes in the
   name are backslash-escaped) inside a generated
   Travel::Status::DE::IRIS::Acronyms module whose get_acronyms() returns
   the collected list.
 * scripts/acronyms.sh downloads the PDF with curl, converts it with
   "pdftotext -raw", pipes the text through scripts/acronyms.pl and
   redirects the result to lib/Travel/Status/DE/IRIS/Acronyms.pm.
 * This copy had lost its line structure and every <...> token. The capture
   names were restored from the "@+{qw{acronym name}}" slice. The readline
   operator is assumed to be <STDIN> (a bare <> behaves the same for the
   argument-less invocation in acronyms.sh) - TODO confirm against upstream.

 scripts/acronyms.pl | 47 +++++++++++++++++++++++++++++++++++++++++++++++
 scripts/acronyms.sh |  5 +++++
 2 files changed, 52 insertions(+)
 create mode 100755 scripts/acronyms.pl
 create mode 100755 scripts/acronyms.sh

(limited to 'scripts')

diff --git a/scripts/acronyms.pl b/scripts/acronyms.pl
new file mode 100755
index 0000000..d78afad
--- /dev/null
+++ b/scripts/acronyms.pl
@@ -0,0 +1,47 @@
+#!/usr/bin/env perl
+
+use strict;
+use warnings;
+use 5.010;
+
+my $re_line = qr{
+	^
+	(?<acronym> [A-Z]{2}[A-Z ]{0,3} )
+	\s
+	(?<name> .+)
+	$
+}x;
+
+say <<'EOF';
+package Travel::Status::DE::IRIS::Acronyms;
+
+use strict;
+use warnings;
+use 5.010;
+use utf8;
+
+our $VERSION = '0.00';
+
+my @acronyms = (
+EOF
+
+while (my $line = <STDIN>) {
+	chomp $line;
+
+	if ($line =~ $re_line) {
+		my ($acronym, $name) = @+{qw{acronym name}};
+		$name =~ s{'}{\\'}g;
+
+		printf("\t['%s','%s'],\n", $acronym, $name);
+	}
+}
+
+say <<'EOF';
+);
+
+sub get_acronyms {
+	return @acronyms;
+}
+
+1;
+EOF
diff --git a/scripts/acronyms.sh b/scripts/acronyms.sh
new file mode 100755
index 0000000..a6bd3ca
--- /dev/null
+++ b/scripts/acronyms.sh
@@ -0,0 +1,5 @@
+#!/bin/sh
+
+curl -s http://www.db-netz.de/file/2361656/data/betriebsstellen.pdf \
+| pdftotext -raw - - | perl scripts/acronyms.pl \
+> lib/Travel/Status/DE/IRIS/Acronyms.pm
-- 
cgit v1.2.3