| commit | 74141b3d2dc0a77833e028370e7e0ff71a4251ad | [log] [tgz] |
|---|---|---|
| author | Marc Kupietz <kupietz@ids-mannheim.de> | Thu Oct 01 23:23:18 2020 +0200 |
| committer | Marc Kupietz <kupietz@ids-mannheim.de> | Mon Oct 12 10:14:58 2020 +0200 |
| tree | 418c4de433b8617e1bb61bf95169493c3ef745bb | |
| parent | 5c6df037afcdc7a149f84d9db50c6c88a5b278db [diff] |
Add -l command line option to choose language

Change-Id: I48e1ce119dfbd75ff9f719ce8525a2c63ad47fc5
diff --git a/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/DerekoDfaTokenizer.jflex b/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/DerekoDfaTokenizer.jflex
index 042080d..939260c 100644
--- a/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/DerekoDfaTokenizer.jflex
+++ b/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/DerekoDfaTokenizer.jflex
@@ -54,6 +54,8 @@ import java.util.ArrayList; import java.util.List; import opennlp.tools.util.Span; + +@Languages({ /*$"\""+target.language+"\" })$*/ /*-*/ ""}) %% /** @@ -70,7 +72,7 @@ %char %{ - private static final CharSequence[] targetLanguages = { /*$"\""+target.language+"\"};$*/ /*-*/ "" }; + private static final CharSequence[] targetLanguages = { /*$"\""+target.language+"\"};$*/ /*-*/ "" }; private boolean xmlEcho = false; private boolean normalize = false; private boolean debug = false; @@ -546,7 +548,7 @@ // pragmas used for anonymization etc. PRAGMA = \[_[A-Z\-]+_\] -%include SEABBR_/*$target.language$*/.jflex-macro +%include language-specific_/*$target.language$*/.jflex-macro %s OPEN_QUOTE POLISH_CONDITIONAL_MODE JUST_AFTER_PERIOD CLITIC_MODE
diff --git a/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/SEABBR_de.jflex-macro b/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/language-specific_de.jflex-macro
similarity index 100%
rename from src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/SEABBR_de.jflex-macro
rename to src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/language-specific_de.jflex-macro
diff --git a/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/SEABBR_en.jflex-macro b/src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/language-specific_en.jflex-macro
similarity index 100%
rename from src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/SEABBR_en.jflex-macro
rename to src/main/jpc/jflex/de/ids_mannheim/korap/tokenizer/language-specific_en.jflex-macro