Blame - t/index/xip_constituency.t - KorAP/KorAP-XML-Krill

blob: 89972e4ee0773f37ca3df315129267588cd35758 [file] [log] [blame]

#!/usr/bin/env perl
# Test that the XIP constituency layer can be added to the tokens of test
# document '0001' and that selected entries of the resulting stream are
# serialized exactly as expected.
use strict;
use warnings;
use utf8;
use Test::More;
use Scalar::Util qw/weaken/;
use Data::Dumper;
use lib 't/index';
use TestInit;

# Load the tokenized test document via the shared test helper.
ok(my $tokens = TestInit::tokens('0001'), 'Parse tokens');

# Attach the XIP/Constituency layer to the tokens.
ok($tokens->add('XIP', 'Constituency'), 'Add Structure');

# The serialized document must advertise the new foundry and layer.
my $data = $tokens->to_data->{data};
like($data->{foundries}, qr!xip/constituency!, 'Foundries');
like($data->{layerInfos}, qr!xip/c=spans!, 'LayerInfos');

# Entries 1..4 of the first stream position.
# The length includes the punct - but that doesn't matter
is($data->{stream}->[0]->[1], '<>:xip/c:PREP$<b>64<i>0<i>3<i>1<b>3', 'Prep phrase');
is($data->{stream}->[0]->[2], '<>:xip/c:PP$<b>64<i>0<i>30<i>4<b>2', 'pp phrase');
is($data->{stream}->[0]->[3], '<>:xip/c:TOP$<b>64<i>0<i>129<i>17<b>0', 'top phrase');
is($data->{stream}->[0]->[4], '<>:xip/c:MC$<b>64<i>0<i>129<i>17<b>1', 'mc phrase');

# First entry of the last stream position (a VERB constituent).
is($data->{stream}->[-1]->[0], '<>:xip/c:VERB$<b>64<i>124<i>128<i>18<b>4', 'Verb phrase');

done_testing;

__END__