#!/usr/bin/env perl
use strict;
use warnings;
use lib 'lib';
use KorAP::Def;
use KorAP::DefList;
use KorAP::ScriptLoad;
use Getopt::Long;

binmode(STDERR, ':encoding(UTF-8)');

# Command line front end that converts C2 virtual corpus definitions
# into KoralQuery virtual corpora. The first argument selects the
# command ('def', 'list' or 'script'); the actual conversion is
# delegated to KorAP::Def, KorAP::DefList and KorAP::ScriptLoad.

# 2020-05-20
#   Preliminary support for C2 def-files.
# 2020-05-29
#   Introduce optimizable object system.
# 2024-07-17
#   Add KorAP::Def.
# 2024-12-16
#   Fix doc trimming
#   Fix country codes.

our $VERSION = 0.4;

# The command has to be the very first argument. It is removed from
# @ARGV before option parsing, so GetOptions only sees the options
# and the remaining positional arguments.
my $cmd = shift @ARGV;

my ($input, $output, $copysrc);

GetOptions(
  "input|i=s"    => \$input,
  "output|o=s"   => \$output,
  "copy-src|c=s" => \$copysrc,
)
  or die("Error in command line arguments\n");

# Missing or unknown command: print the usage text and signal failure.
if (!$cmd || ($cmd ne 'def' && $cmd ne 'list' && $cmd ne 'script')) {
  print <<'HELP';
Convert a list of C2 VC definitions, a single definition or a script file into
KoralQuery VCs.

$ perl cosmasvc2koralquery def my_vc.txt | gzip -vc > my_vc.jsonld.gz
$ cat my_vc.txt | perl cosmasvc2koralquery def - | gzip -vc > my_vc.jsonld.gz

Command: def

Convert a def file or a list of sigles to a KoralQuery VC.

Takes the list or def from STDIN and exports to STDOUT.

Command: list

Convert a list with copy or regex instructions to KoralQuery VCs.

--output: The output directory
--copy-src: The directory for def files to copy

Command: script

Convert a script file with LOAD() instructions to KoralQuery VCs.

--output: The output directory

HELP
  exit 1;
};


# Process a list.
# The list file is taken from --input or, if that is not given, from
# the first positional argument. Both directories default to '.'.
if ($cmd eq 'list') {
  KorAP::DefList->new(
    file   => ($input   || $ARGV[0]),
    copy   => ($copysrc || '.'),
    output => ($output  || '.')
  )->parse;
  exit(0);
};

# Process a script file.
# The script file is taken from --input or, if that is not given, from
# the first positional argument. The output directory defaults to '.'.
if ($cmd eq 'script') {
  KorAP::ScriptLoad->new(
    file   => ($input  || $ARGV[0]),
    output => ($output || '.')
  )->parse;
  exit(0);
};


# Parse a single def.
# Source precedence: a positional '-' selects STDIN, then --input,
# then the first positional argument.
my $source = $ARGV[0];

my $def_parser;

# The positional argument may be absent (e.g. 'def --input file'),
# so it has to be checked for definedness before the string
# comparison - otherwise an 'uninitialized value' warning is raised.
if (defined $source && $source eq '-') {
  $def_parser = KorAP::Def->new(\*STDIN);
}
elsif ($input) {
  $def_parser = KorAP::Def->new($input);
}
else {
  # NOTE(review): $source is undefined here if no input was given at
  # all; how KorAP::Def->new treats that is not visible in this file.
  $def_parser = KorAP::Def->new($source);
};

$def_parser->parse;

# Stringify current (extended?) virtual corpus
print $def_parser->to_string;