blob: 5a907cc028494d7efa374a4cb55b6066aafe0c76 [file] [log] [blame]
# text_id = TST_TST.00001
# empty texts are expected to count
# text_id = TST_TST.00002
1 ich ich PPER PPER _ _ _ _ 1
2 bin sein VAFIN VAFIN _ _ _ _ 1.000000
3 alex alex NE NE _ _ _ _ 0.565630
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00003
1 alex alex NE NE _ _ _ _ 0.565630
2 bin sein VAFIN VAFIN _ _ _ _ 1.000000
3 ich ich PPER PPER _ _ _ _ 1
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00004
# make sure that an empty text header does no harm
# text_id = TST_TST.00005
1 ich ich PPER PPER _ _ _ _ 1
2 heiße heißen VAFIN VAFIN _ _ _ _ 1.000000
3 alex alex NE NE _ _ _ _ 0.565630
4 . . $. $. _ _ _ _ 1.000000
# text_id = TST_TST.00006
# make sure that an empty text header does no harm
# text_id = TST_TST.00007
# in the unigrams we should have 7 start and end tags