blob: 48dc9fc04df67ee03201f5bd7038fd7575326cd0 [file] [log] [blame]
# text_id = TST_TST.00001
# empty texts are expected *not* to be counted
# text_id = TST_TST.00002
1 ich ich PPER PPER _ _ _ _ 1
2 bin sein VAFIN VAFIN _ _ _ _ 1.000000
3 alex alex NE NE _ _ _ _ 0.565630
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00003
1 alex alex NE NE _ _ _ _ 0.565630
2 bin sein VAFIN VAFIN _ _ _ _ 1.000000
3 ich ich PPER PPER _ _ _ _ 1
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00004
# make sure that an empty text header does no harm
# text_id = TST_TST.00005
1 ich ich PPER PPER _ _ _ _ 1
2 heiße heißen VAFIN VAFIN _ _ _ _ 1.000000
3 alex alex NE NE _ _ _ _ 0.565630
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00006
# make sure that an empty text header does no harm
# text_id = TST_TST.00007
# the unigrams should contain 3 start tags and 3 end tags (one pair per non-empty text), because empty texts are no longer counted as of v2.2.3