blob: ad286dfd4781118a4fe1099bfe37ccee9422293b [file] [log] [blame]
Akron8b511f92020-07-09 17:28:08 +02001#!/usr/bin/env perl
2use strict;
3use warnings;
4use FindBin;
5BEGIN {
6 unshift @INC, "$FindBin::Bin/../../lib";
7};
8use KorAP::XML::TEI::Tokenizer::Aggressive;
9
# Flush STDOUT after every print instead of buffering.
# NOTE(review): presumably needed because a parent process talks to this
# script through pipes and waits for each result line - confirm with caller.
$| = 1;

# Init tokenizer
my $tok = KorAP::XML::TEI::Tokenizer::Aggressive->new;

# Read lines from STDIN and print the token boundaries of each line.
#
# The loop reads from and terminates on the same handle (STDIN). Testing
# eof(STDIN) while reading with the null filehandle <> would consult two
# different handles as soon as file names are passed in @ARGV, and could
# hand an undefined line to the tokenizer.
while (defined(my $line = <STDIN>)) {

  # The line is passed on unchanged (including its trailing newline)
  $tok->tokenize($line);

  # Exactly one output line per input line: boundaries joined by spaces
  print join(' ', $tok->boundaries), "\n";

  # Reset the tokenizer before the next line
  # NOTE(review): presumably discards the boundaries collected so far
  $tok->reset;
}

1;