aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rwxr-xr-x dicts/czech-wordnet.pl 5
1 files changed, 4 insertions, 1 deletions
diff --git a/dicts/czech-wordnet.pl b/dicts/czech-wordnet.pl
index d626e5a..d1d32f9 100755
--- a/dicts/czech-wordnet.pl
+++ b/dicts/czech-wordnet.pl
@@ -4,11 +4,14 @@
use warnings;
use strict;
+# GNU gzip can unpack a ZIP file, but BSD gzip cannot, and unzip can't read from stdin
+my $zipcat = qx/command -v bsdtar/ ? 'bsdtar -xOf-' : 'zcat';
+
my $base = 'https://lindat.cz/repository/xmlui';
my $path = 'handle/11858/00-097C-0000-0001-4880-3';
open(my $doc, '-|',
"curl -Lo- '$base/bitstream/$path/Czech_WordNet_1.9_PDT.zip'"
- . ' | zcat | iconv -f latin2 -t UTF-8') or die $!;
+ . " | $zipcat | iconv -f latin2 -t UTF-8") or die $!;
# https://nlp.fi.muni.cz/trac/deb2/wiki/WordNetFormat but not quite;
# for terminology see https://wordnet.princeton.edu/documentation/wngloss7wn