commit | cc3914703908d25fc3bade72a32e0c2169a187da | [log] [tgz] |
---|---|---|
author | Marc Kupietz <kupietz@ids-mannheim.de> | Mon Jun 24 10:48:34 2024 +0200 |
committer | Marc Kupietz <kupietz@ids-mannheim.de> | Mon Jun 24 15:10:49 2024 +0200 |
tree | f3c79d11ad2a8b6bf0e1f5b1f1653423ec7e8714 | |
parent | 249fc8310cea40390425808956d773e5b014cb9b [diff] |
2korapxml: Trim docid to avoid spurious trailing spaces

Change-Id: I2b7d80a6add6c6b8867f785813c16dbd0f5c43cd
```diff
diff --git a/script/conllu2korapxml b/script/conllu2korapxml
index eaa06aa..e285abf 100755
--- a/script/conllu2korapxml
+++ b/script/conllu2korapxml
@@ -115,6 +115,7 @@
       }
     } elsif(/^(?:#|0\.2)\s+text_id\s*[:=]\s*(.*)/) {
       $docid=$1;
+      $docid =~ s/\s+$//;
       my $docSigle = $docid;
       $docSigle =~ s/\..*//;
       if($docSigle ne $lastDocSigle) {
```