Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 1 | # text_id = TST_TST.00001 |
Marc Kupietz | 104c94b | 2023-02-02 19:53:53 +0100 | [diff] [blame] | 2 | # empty texts are expected to count *not* |
Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 3 | |
| 4 | # text_id = TST_TST.00002 |
Marc Kupietz | a691041 | 2021-09-23 23:15:20 +0200 | [diff] [blame] | 5 | 1 ich ich PPER PPER _ _ _ _ 1 |
| 6 | 2 bin sein VAFIN VAFIN _ _ _ _ 1.000000 |
| 7 | 3 alex alex NE NE _ _ _ _ 0.565630 |
| 8 | 4 . . $. $. _ _ _ _ 1.000000 |
| 9 | |
Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 10 | # text_id = TST_TST.00003 |
Marc Kupietz | a691041 | 2021-09-23 23:15:20 +0200 | [diff] [blame] | 11 | 1 alex alex NE NE _ _ _ _ 0.565630 |
| 12 | 2 bin sein VAFIN VAFIN _ _ _ _ 1.000000 |
| 13 | 3 ich ich PPER PPER _ _ _ _ 1 |
| 14 | 4 . . $. $. _ _ _ _ 1.000000 |
| 15 | |
Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 16 | # text_id = TST_TST.00004 |
| 17 | # make sure that an empty text header does no harm |
| 18 | |
| 19 | # text_id = TST_TST.00005 |
Marc Kupietz | a691041 | 2021-09-23 23:15:20 +0200 | [diff] [blame] | 20 | 1 ich ich PPER PPER _ _ _ _ 1 |
| 21 | 2 heiße heißen VAFIN VAFIN _ _ _ _ 1.000000 |
| 22 | 3 alex alex NE NE _ _ _ _ 0.565630 |
| 23 | 4 . . $. $. _ _ _ _ 1.000000 |
Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 24 | |
| 25 | # text_id = TST_TST.00006 |
| 26 | # make sure that an empty text header does no harm |
| 27 | |
| 28 | # text_id = TST_TST.00007 |
Marc Kupietz | 104c94b | 2023-02-02 19:53:53 +0100 | [diff] [blame] | 29 | # in the unigrams we should have 3 start and end tags, because empty texts do not count starting with v2.2.3 |
Marc Kupietz | e4adb69 | 2021-09-26 11:57:01 +0200 | [diff] [blame] | 30 | |
| 31 | |