| # text_id = TST_TST.00001 |
| # empty texts are expected *not* to count |
| |
| # text_id = TST_TST.00002 |
| 1 ich ich PPER PPER _ _ _ _ 1 |
| 2 bin sein VAFIN VAFIN _ _ _ _ 1.000000 |
| 3 alex alex NE NE _ _ _ _ 0.565630 |
| 4 . . $. $. _ _ _ _ 1.000000 |
| |
| # text_id = TST_TST.00003 |
| 1 alex alex NE NE _ _ _ _ 0.565630 |
| 2 bin sein VAFIN VAFIN _ _ _ _ 1.000000 |
| 3 ich ich PPER PPER _ _ _ _ 1 |
| 4 . . $. $. _ _ _ _ 1.000000 |
| |
| # text_id = TST_TST.00004 |
| # make sure that an empty text header does no harm |
| |
| # text_id = TST_TST.00005 |
| 1 ich ich PPER PPER _ _ _ _ 1 |
| 2 heiße heißen VAFIN VAFIN _ _ _ _ 1.000000 |
| 3 alex alex NE NE _ _ _ _ 0.565630 |
| 4 . . $. $. _ _ _ _ 1.000000 |
| |
| # text_id = TST_TST.00006 |
| # make sure that an empty text header does no harm |
| |
| # text_id = TST_TST.00007 |
| # in the unigrams we should have 3 start tags and 3 end tags, because as of v2.2.3 empty texts are not counted |
| |
| |