Akron | 78f6714 | 2022-04-09 14:10:44 +0200 | [diff] [blame^] | 1 | ! General rules that require certain language-specific definitions |
| 2 | |
| 3 | ! A solution to the "(author): problem" may be to add ) at the end of any |
| 4 | ! string as a possible ending |
| 5 | define Years [ %( Digit+ (%.) %) ] | [ %[ Digit+ (%.) %] ]; |
| 6 | |
| 7 | ! Clock-style times such as 20:00 (Uhr) or 00:12:25,34: one or two digits, one or two ":dd" groups, optional "," plus 1-3 digits |
| 8 | define Times ([%0|1|2|3|4|5]) Digit ":" [%0|1|2|3|4|5] Digit (":" [%0|1|2|3|4|5] Digit) ("," Digit^{1,3}); |
| 9 | |
| 10 | ! Include the emoticon definitions |
| 11 | source all/emoticons.xfst |
| 12 | |
| 13 | ! Include the XML definitions (presumably tags/markup - confirm in all/xml.xfst) |
| 14 | source all/xml.xfst |
| 15 | |
| 16 | ! Include the XML entity definitions |
| 17 | source all/entities.xfst |
| 18 | |
| 19 | ! Include the technical protocol definitions (presumably URL-like schemes - confirm in all/protocols.xfst) |
| 20 | source all/protocols.xfst |
| 21 | |
| 22 | ! Punctuation allowed between digit groups, so that Num also supports |
| 23 | ! 19.4.2015, 19/4/2015 etc. |
| 24 | define DigitPunct [ %_ | %- | %. | %, | Slash ]; |
| 25 | define Num Digit+ [DigitPunct Digit+]* Char*; |
| 26 | |
| 27 | ! Ordinals: one to three digits followed by a dot |
| 28 | define Ord Digit^{1,3} %.; |
| 29 | |
| 30 | ! TODO: |
| 31 | ! floating point, serial, model numbers, ip addresses, etc. |
| 32 | ! every other segment must have at least one digit |
| 33 | |
| 34 | ! Words with characters replaced by two or more asterisks, like "fu**ing!" |
| 35 | define Omission Char+ Asterisk^2 Asterisk* Char*; |
| 36 | |
| 37 | ! Dotted acronyms of at least three letters: U.S.A., I.B.M., etc. |
| 38 | ! Use a post-filter to remove the dots |
| 39 | define AcronymDep [Letter %.]^2 [Letter %.]+; |
| 40 | |
| 41 | |
| 42 | ! TODO: Name words with ' and ` |
| 43 | |
| 44 | ! Support ASCII elements, like |
| 45 | ! +---------------+ |
| 46 | ! <---->, -->, <-- |
| 47 | ! +---------------+ |
| 48 | ! <---> | Worker Node N | |
| 49 | ! +---------------+ |
| 50 | ! |============= Core =============| |
| 51 | |