)]}'
{
  "log": [
    {
      "commit": "c831089410cb48dd1cd6c0212381434e3c7e9f14",
      "tree": "27e01e776ecff1f81414911125f9812e998b6884",
      "parents": [
        "2e42b9754c7d98339115843953fd067f3be3a5ec"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Jan 28 13:46:13 2026 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Jan 28 13:46:13 2026 +0100"
      },
      "message": "Don\u0027t treat soft hyphens (U+00AD) as token boundaries\n\nResolves #131\n\nChange-Id: Ia62f5ff91d82ef22830d8fd31afb701c9b703c26\n"
    },
    {
      "commit": "be5de89aa8e6be7b5ed0cedba1d9835a92ecfea9",
      "tree": "18978e067d50c607be4fda0b5b855920eb94375a",
      "parents": [
        "18d4430222945702be1c7e54a53fa207e4f3ac4d"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Dec 11 09:46:01 2025 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Dec 11 10:39:57 2025 +0100"
      },
      "message": "Add hyphenated compound abbreviations for German\n\nResolves #116\n\nChange-Id: I1fed5bcb91ceb7a7e0c71daf9be43528701d1e42\n"
    },
    {
      "commit": "bf9f4de23216aa81f52d075a9b637407fde58f5a",
      "tree": "e0928df6e7020e70f7f1e98c166e75b9d8fc5da4",
      "parents": [
        "c3e42e028199484473651a18cb1e630aeabbbe5a"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 14:41:40 2025 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 14:41:40 2025 +0100"
      },
      "message": "Add Wikipedia emoji template support\n\nResolves #114\n\nChange-Id: I55d4e8d18d1a290b4f918cabbe19ed757c630037\n"
    },
    {
      "commit": "748fcb4802caa3808d358e8932b609a4e8bba95c",
      "tree": "87c03ef2bd028ff59b479ab98ab2e9157e877201",
      "parents": [
        "e937b972399eb8522cd69dae0050098049cf5e13"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 14:03:29 2025 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 14:16:35 2025 +0100"
      },
      "message": "Add support for emoji clusters\n\nResolves #113\n\nChange-Id: Ia5f0da30559a97332748dfc9e2595852e2477d1a\n"
    },
    {
      "commit": "88b15ed83dbae3d9210d7c90b4db81d5c66d6bf2",
      "tree": "0f32e1694029b48fc7027e7eaad878ce9e39a24c",
      "parents": [
        "0235ea0b942103e4d1e730c60e68e1cb5ab15ca7"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 12:24:25 2025 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 13:00:51 2025 +0100"
      },
      "message": "Fix Genderstern and ommission word token breaks after hyphens\n\nResolves #115\n\nChange-Id: Iacf5667b508050a6dfd09ca9938f449d05582a95\n"
    },
    {
      "commit": "0235ea0b942103e4d1e730c60e68e1cb5ab15ca7",
      "tree": "0181ff6e814d16d1cbc57919d7fba9da28d6763d",
      "parents": [
        "1ff43d5f993f19042652bacf365cebd2a1805300"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 11:56:59 2025 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Dec 07 12:23:22 2025 +0100"
      },
      "message": "Add build variable force.fast to speed up debug builds\n\nChange-Id: I55aca822a3245ee501a2e184d55304bc300341e8\n"
    },
    {
      "commit": "f7ca6d7da838672d3fb2fc0dfc8a07d83bbf0ceb",
      "tree": "0625104452a9a3fd830d94d1a48421197e9f6591",
      "parents": [
        "6cf96f276941c11cce2f7da621efe2792bba178e"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 13:40:40 2023 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 13:40:40 2023 +0200"
      },
      "message": "Remove or fix some automatic API comments\n\nChange-Id: I73c5b3e2e0e6b3fcdc9afca07d73971d785059d1\n"
    },
    {
      "commit": "439731eeab9174e95bb58f3882c066cb32bdad06",
      "tree": "f2b9b48bb72c783aefedc5d492287cf4caf5a236",
      "parents": [
        "f8b7d95a1c16f4e1ead5eb6d78f6356f0f5d6ee3"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 08:02:11 2023 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 08:02:11 2023 +0200"
      },
      "message": "Replace deprecated newInstance invocation\n\nChange-Id: Ic74611cc3203ef12dd58f7c2134f52c85a4a2ecc\n"
    },
    {
      "commit": "f8b7d95a1c16f4e1ead5eb6d78f6356f0f5d6ee3",
      "tree": "c4633ac09aaa15fca79e59809feeea14042a316d",
      "parents": [
        "d1dc8488838de6686bde867d8924b77f7f3f3574"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 08:00:55 2023 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 08 08:00:55 2023 +0200"
      },
      "message": "Get version information from jar manifest\n\nSee https://github.com/remkop/picocli/issues/1663\n\nChange-Id: I9c35e336dd06956967d3a07318c1f397b8518091\n"
    },
    {
      "commit": "d1dc8488838de6686bde867d8924b77f7f3f3574",
      "tree": "263cb44c0539a52fce109452c52e86df98e41813",
      "parents": [
        "4128bee84abea2a66491f9242f77236e078ef551"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 07 21:28:23 2023 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 07 21:28:23 2023 +0200"
      },
      "message": "Add mostly auto-generated api documentation\n\nChange-Id: Ib007e4fbe69d3197a29f478a809fec4e3a541f4e\n"
    },
    {
      "commit": "c2f448ce40518e8df5fa6e75c22580be09b00ad2",
      "tree": "805b7a00098da81e931ca540f970387838d26019",
      "parents": [
        "ced7882a257daf3001fcadd5b4b3d0ec1e252db6"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 05 16:04:31 2023 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Sep 06 09:36:25 2023 +0200"
      },
      "message": "Bump version to 2.2.3, update Readme and Changlog\n\nChange-Id: Ic4928596d72ce3f738a47f112d8064dc63324f56\n"
    },
    {
      "commit": "33294d9332f8e11f10d6de8b5d461c3a01fd74de",
      "tree": "1b14c1bf190afa29593de7e9bd6ab208976c5004",
      "parents": [
        "eed234f61e0bd0f672f0156b8b6759128c917f2d"
      ],
      "author": {
        "name": "dependabot[bot]",
        "email": "49699333+dependabot[bot]@users.noreply.github.com",
        "time": "Thu Feb 23 18:14:16 2023 +0000"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Mar 02 11:33:56 2023 +0100"
      },
      "message": "Bump opennlp-tools from 1.9.4 to 2.1.1\n\nBumps [opennlp-tools](https://github.com/apache/opennlp) from 1.9.4 to 2.1.1.\n- [Release notes](https://github.com/apache/opennlp/releases)\n- [Commits](https://github.com/apache/opennlp/compare/opennlp-1.9.4...opennlp-2.1.1)\n\nResolves #74\n\n---\nupdated-dependencies:\n- dependency-name: org.apache.opennlp:opennlp-tools\n  dependency-type: direct:production\n  update-type: version-update:semver-major\n...\n\nSigned-off-by: dependabot[bot] \u003csupport@github.com\u003e\nChange-Id: I6881d2657fbd1c76822fed8e3ee3bebdd7587b0f\n"
    },
    {
      "commit": "609ab476ebec829bc51609c16a6bc16fd6a7e058",
      "tree": "8650f6883e7c2cbc25408f4eb1aba6cd30978de8",
      "parents": [
        "7d926b27c9d58602cf664f87dfcd1675b482e8f9"
      ],
      "author": {
        "name": "Gregor Middell",
        "email": "gregor@middell.net",
        "time": "Fri May 27 09:51:49 2022 +0200"
      },
      "committer": {
        "name": "Gregor Middell",
        "email": "gregor@middell.net",
        "time": "Fri May 27 09:51:49 2022 +0200"
      },
      "message": "Imports java.io\u0027s ByteArrayOutputStream instead of 3rd-party class\n"
    },
    {
      "commit": "6e67723708940b577689f959e972ba367bc5315d",
      "tree": "e277a7e955309d6acd96aea9230f5a324eb85674",
      "parents": [
        "b7f8135ccda35c123236f144f5d6e34912fc89f2"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Jan 14 12:38:45 2022 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Jan 14 12:38:45 2022 +0100"
      },
      "message": "Omission words cannot start with white space\n\nFixes bug that interprets a single quotation mark at the beginning of a word\nnot as token, but as beginning of an omission.\n\nChange-Id: I97ca48755eeecdee1029e90da4df72121d05c688\n"
    },
    {
      "commit": "1501f5ab34b936c4491bcf14b38658c77df47501",
      "tree": "d5debd31f0cc0179d5ccef9d9eb329499a53ad6d",
      "parents": [
        "7cbc20562818db285b044ffc0049001075f893df"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Nov 05 10:58:55 2021 +0100"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Nov 05 10:58:55 2021 +0100"
      },
      "message": "Extend test suite\n\nChange-Id: I251aaacd15a204d941229f12671e82d48efe5653\n"
    },
    {
      "commit": "7cbc20562818db285b044ffc0049001075f893df",
      "tree": "6495a7da240d5d9857b613fb11833bc03070bdc8",
      "parents": [
        "5b8f67494d65ade35833d3770407cc78c2ec9234"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Oct 23 14:21:48 2021 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sun Oct 24 19:50:46 2021 +0200"
      },
      "message": "Remove \u0027du\u0027 from abbreviation list\n\nChange-Id: I6873861bd6bc51260acca9a9046a3dc72b8b79ac\n"
    },
    {
      "commit": "5b8f67494d65ade35833d3770407cc78c2ec9234",
      "tree": "4aa4f9a0673c8c49025cf96d0c675b3d83aed3f9",
      "parents": [
        "210fc240a02434fa7c0e00365a6c0011b3f80c11",
        "b7084ce4caa7aba342df3ffa5734f64d12bd0978"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 07 18:48:47 2021 +0200"
      },
      "committer": {
        "name": "Gerrit Code Review",
        "email": "gerrit2@korap.ids-mannheim.de",
        "time": "Tue Sep 07 18:48:47 2021 +0200"
      },
      "message": "Merge \"Simplified FNAME rule\""
    },
    {
      "commit": "210fc240a02434fa7c0e00365a6c0011b3f80c11",
      "tree": "53e088d4bd6252102cd8b75d8c0f9cba343914a6",
      "parents": [
        "f061efbd92ef087ee6b8476c5f20632f0e93c3ea"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Aug 13 00:58:19 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Aug 27 18:55:43 2021 +0200"
      },
      "message": "Remove dir/Dir from German abbreviations\n\nIt\u0027s more important and expectable to find the word rather than\nthe abbreviation.\n\nChange-Id: I71a8863830c3d456003c595619ec6f6ec6cc74a5\n"
    },
    {
      "commit": "f061efbd92ef087ee6b8476c5f20632f0e93c3ea",
      "tree": "4de330589c20eb03fd1ffbe48411afcb2cb61605",
      "parents": [
        "0abcb5939eb59bf04e0729792760a46d3d283ecb"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Aug 20 15:44:30 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Aug 20 15:46:15 2021 +0200"
      },
      "message": "Bump to dev version 2.2.0.9000\n\nChange-Id: I0bdf6b4a57c86ad551a7a9a011ffb96566fd238f\n"
    },
    {
      "commit": "b7084ce4caa7aba342df3ffa5734f64d12bd0978",
      "tree": "c5b0c49929d5a07c83f2d5aa0c67d4ba7587d985",
      "parents": [
        "0abcb5939eb59bf04e0729792760a46d3d283ecb"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Wed Aug 11 17:56:54 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Aug 20 15:09:42 2021 +0200"
      },
      "message": "Simplified FNAME rule\n\nChange-Id: I5ae2d9869bab443c3df49383da768dd09d9f3379\n"
    },
    {
      "commit": "ab9187de39116f5566a3cebf6bc142742c0f50ef",
      "tree": "585052cf0844902c8524bd86edfefac672ea5856",
      "parents": [
        "1f90daf87e6c1f8db9864fdbb0efca67c35d5bbb"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Wed Jul 28 17:51:57 2021 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Wed Jul 28 17:51:57 2021 +0200"
      },
      "message": "Improve test suite and lower acceptance values\n\nChange-Id: I80f0adce1787887fb61a052a24d03d798b45c157\n"
    },
    {
      "commit": "1f90daf87e6c1f8db9864fdbb0efca67c35d5bbb",
      "tree": "8328fbd38f5cacd2befbadbb155f4a0e2b23e574",
      "parents": [
        "56481ea82609f27dc2cb4ea1467dcdb2dc68fc0c"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Jul 28 10:47:15 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Jul 28 10:49:22 2021 +0200"
      },
      "message": "Bump version to v2.2.0\n\nChange-Id: I954f1338932e17f60adb9af33bb5b4a8f06c2553\n"
    },
    {
      "commit": "6d28ed1b72bf3dc34fb72894b8998819c0f662c2",
      "tree": "09d246aaf47d08d38bf2ceb2f9e6c5a9b1684951",
      "parents": [
        "a1459227d3b167a31d31d5a706f0a90256ede74b"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Jul 15 21:09:47 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Jul 16 21:36:38 2021 +0200"
      },
      "message": "Separate apostrophe marked contractions and clitics for en and fr\n\nThe original working rule was overwritten with a rule for German \"omission\nwords\" like \"W\u0027schaft\", \"M\u0027gladbach\u0027, ... in:\n\nhttps://korap.ids-mannheim.de/gerrit/c/private/Ingestion/+/390/1/src/main/jflex/de/ids_mannheim/korap/tokenizer/KorAPTokenizerImpl.jflex\n\nFor German we stick to the standard of *not* separating clitics and\ncontractions, however the changes for English end French words will\nalso be applied in the de tokenizer except for \u0027s and \u0027n.\n\nThanks @Mai \u0026 Harald!\n\nResolves #22\n\nChange-Id: I5e0a81fd38709e49a734d16ad077265a1571c824\n"
    },
    {
      "commit": "a1459227d3b167a31d31d5a706f0a90256ede74b",
      "tree": "f2bfc2baf879561fa102a8866dffd2b6e452f676",
      "parents": [
        "732905f6cee69d22fcd18f69ee3c4d42807f82df"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Jul 16 17:48:45 2021 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Jul 16 18:03:25 2021 +0200"
      },
      "message": "Bump to new dev version 2.1.0.9000\n\nChange-Id: I0c588f94ccbb62d93bb1c98e80ecbb50c0c61fa3\n"
    },
    {
      "commit": "732905f6cee69d22fcd18f69ee3c4d42807f82df",
      "tree": "bcf9ce418cab1ae697a69545ebdaee6681577567",
      "parents": [
        "9ead93658891632b1efd886fcc70a86e0604de96"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Jun 28 18:44:53 2021 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jun 29 11:16:30 2021 +0200"
      },
      "message": "Release v2.1.0\n\nChange-Id: Ic414422b4d0da0265ee6486e343fbd105498d7ab\n"
    },
    {
      "commit": "96bd87c86835cef50d7edbb8be71147f17283640",
      "tree": "67abc5eaf39c886ec4276e74a65acef7b30cd587",
      "parents": [
        "6bf46827dab3955bdfa99ea741bf727fb3d6cdb0"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Mar 21 16:41:53 2021 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Jun 05 15:39:44 2021 +0200"
      },
      "message": "Improve systematicity of options -p, -s, --[no-]tokens\n\n-s alone should just print sentence boundary markers an no offsets. E.g.:\n\necho -n -e \u0027Das ist der 1. Satz. Hier folgt der zweite.\u0027 | java -jar\ntarget/KorAP-Tokenizer-2.0.0-standalone.jar -s\n\nDas\nist\nder\n1.\nSatz\n.\n\nHier\nfolgt\nder\nzweite\n.\n\nThanks @Roman!\n\nChange-Id: I6a5f7e169d1ecb433de0c5f7168f9cd6f3930890\n"
    },
    {
      "commit": "72cc171d7bc30ab15b3d99c31ab449133a7cdc07",
      "tree": "333d31a7fb04f13487eb1312e719d46cbdca6cce",
      "parents": [
        "f2d1ffc6d63cc73fb119a73f16f745b66c862b9b"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Dec 09 12:05:35 2020 +0100"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Dec 09 12:05:35 2020 +0100"
      },
      "message": "Release v2.0.0\n\nChange-Id: I4aac363c1f4bbd4109d0430b1969b48e7271e266\n"
    },
    {
      "commit": "755a150690e99688f4bd0d3d499fcc39183f0554",
      "tree": "0893a093990e2fb1a2a064c961d627d2596a6836",
      "parents": [
        "cf9b5f5cb448bcccc15d1bd505f4d4423a1ea3b3"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 16:02:28 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Dec 08 12:22:33 2020 +0100"
      },
      "message": "Prepare for v2.0.0\n\nChange-Id: I6845bddca6ad966699cc029a43d1badb113d223a\n"
    },
    {
      "commit": "cf9b5f5cb448bcccc15d1bd505f4d4423a1ea3b3",
      "tree": "d586b4770c065a513790119f147dabbcf2b5c982",
      "parents": [
        "45d2dba17f569b8a32e4a9c1e79d9abd69181313"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 06:51:03 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:45:45 2020 +0200"
      },
      "message": "Add heuristcis for distinguishing I. as abbrevation vs PPER / CARD\n\nChange-Id: I3f9230bb637cf8cd68ae12a4671a35f5b0dd4b22\n"
    },
    {
      "commit": "2199f76ec648de381b3783bb182840b802e36afc",
      "tree": "cc9ded3df40598f3ad166da395512fa615f134a5",
      "parents": [
        "e3282b0936a96957a69abb4d94cc7d36ad1d03fa"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Oct 13 14:49:54 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:40:27 2020 +0200"
      },
      "message": "Simplify German abbreviations\n\nChange-Id: I9ab151f2cf2de3b09660ddf305899b1b96a89ac4\n"
    },
    {
      "commit": "e3282b0936a96957a69abb4d94cc7d36ad1d03fa",
      "tree": "758d3854a701453ea6ca40d6e18d15df296dd529",
      "parents": [
        "4fb896a5bc95fcd2eb02a6d63ef8d471ca801431"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Oct 13 10:29:23 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:40:27 2020 +0200"
      },
      "message": "Accept URLs starting with \"www.\" without URI scheme\n\nChange-Id: I5b46b93984f1192ed0b67ddc1fa05051aae16405\n"
    },
    {
      "commit": "4fb896a5bc95fcd2eb02a6d63ef8d471ca801431",
      "tree": "51a78963308b1d7e0d9936cb984535d281d638bf",
      "parents": [
        "f5a7e04885f2149f41323b9abfedd3efec10dfe1"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 17:51:48 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:40:24 2020 +0200"
      },
      "message": "Amend English abbreviation macro\n\n... based on English Wikipedia articles and talk pages\n\nChange-Id: Ia074e125527e89c53423e3c395d872bb5861cabd\n"
    },
    {
      "commit": "f5a7e04885f2149f41323b9abfedd3efec10dfe1",
      "tree": "846699be050458ff833140b3d706682e500ef4e7",
      "parents": [
        "74141b3d2dc0a77833e028370e7e0ff71a4251ad"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:43:24 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:34:53 2020 +0200"
      },
      "message": "Add French tokenizer (-l fr)\n\nBased on French Wikipedia articles and talk pages\n\nChange-Id: I3ee72d7d73e567638b6882a101baaf3b5ffee258\n"
    },
    {
      "commit": "74141b3d2dc0a77833e028370e7e0ff71a4251ad",
      "tree": "418c4de433b8617e1bb61bf95169493c3ef745bb",
      "parents": [
        "5c6df037afcdc7a149f84d9db50c6c88a5b278db"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 01 23:23:18 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:14:58 2020 +0200"
      },
      "message": "Add -l command line option to choose language\n\nChange-Id: I48e1ce119dfbd75ff9f719ce8525a2c63ad47fc5\n"
    },
    {
      "commit": "5c6df037afcdc7a149f84d9db50c6c88a5b278db",
      "tree": "f2a35d8226b827a88135d14a6943e1f5f950618e",
      "parents": [
        "ce48102c8ed132cb97dd89f90c3ecd38009e4a71"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 29 22:19:38 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:10:07 2020 +0200"
      },
      "message": "List available KorapTokenizerImplementation options for -T\n\nChange-Id: I8e45410f67decb6b44fc9574dfe94c89b7abd0cc\n"
    },
    {
      "commit": "ce48102c8ed132cb97dd89f90c3ecd38009e4a71",
      "tree": "652465801ff4ace03ffe27372170186efc31f29e",
      "parents": [
        "67eed1c2ffa2a4b61958071d61f4f84d9bd10861"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Oct 11 12:08:16 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Oct 11 12:08:16 2020 +0200"
      },
      "message": "Recognize {LETTER}+str. as abbreviation for Straße in de-tokenizer\n\nChange-Id: If4bdc02994e2a4ee48051f5047f78d2dddeb10c5\n"
    },
    {
      "commit": "67eed1c2ffa2a4b61958071d61f4f84d9bd10861",
      "tree": "ae3a7c8042c9eaaf534909b99ad46d10bfde1e1f",
      "parents": [
        "8e197f3c8895ff5d66d903f17da7e915076c84c8"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 28 21:37:16 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Oct 09 14:48:55 2020 +0200"
      },
      "message": "Build language specific tokenizers: de, en\n\nChange-Id: Iedad4d96aa702e173ed98d888685b4dd7b113cd5\n"
    },
    {
      "commit": "8e197f3c8895ff5d66d903f17da7e915076c84c8",
      "tree": "a0d68069e2c9cc3e9f26f2d23fbd88c501b13063",
      "parents": [
        "ad22e2ce7f253650d96373bb1fd6472f091075a9"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 09:20:37 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 18:06:46 2020 +0200"
      },
      "message": "Allow setting input encoding explicitely whith -e \u003cencoding\u003e\n\nAnd use UTF-8 as default.\n\nOtherwise tests fail if no UTF-8 locale is set.\n\nChange-Id: Ie2b8ef2009a037b767b95710e84266af75381fb9\n"
    },
    {
      "commit": "37018068f9423b8f229257c9b0c30fe1e64e66d8",
      "tree": "55fea5da9d678375c67cdf09c779fddab77e05f9",
      "parents": [
        "751868b9a6f8c65ae26bd212c746c91e80d00d7c"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 17:54:59 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 17:55:34 2020 +0200"
      },
      "message": "Do not use commit ids for naming standalone jars\n\nChange-Id: I713ea18c9c9db796bc74e90c7bc5b83885a4b805\n"
    },
    {
      "commit": "751868b9a6f8c65ae26bd212c746c91e80d00d7c",
      "tree": "efa93123637391ce7b6718a269495f9677717a64",
      "parents": [
        "b9f45e084ceca956b3378fe12d20d9d5b08edadc"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 25 17:59:38 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 28 09:04:10 2020 +0200"
      },
      "message": "Make tokenizer implementation exchangeable\n\nAllows for quite an easy adaptation and integration of other language\nspecializations and other tokenizers, also from the command line with\nnew -T option that allows to specify the tokenizer class name.\n\nTODO: add documentation to the KorapTokenizer interface\n\nChange-Id: Ib95793f47887a3b0829d68ebdbf8bc40815a0605\n"
    },
    {
      "commit": "b9f45e084ceca956b3378fe12d20d9d5b08edadc",
      "tree": "c600f3a8d842f7ee6607080840ea0701de57085c",
      "parents": [
        "c419d5b22c508a352f00fb11f23034a10bfbaf3d"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 17 20:03:59 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 18 19:13:17 2020 +0200"
      },
      "message": "Rename tokenizer class to KorAPDFATokenizer\n\nChange-Id: Icad8af7582689f599eda27258cc397e6155aeefe\n"
    },
    {
      "commit": "c419d5b22c508a352f00fb11f23034a10bfbaf3d",
      "tree": "83eb21aa0d47920a7c1fcd225601249c1dc4108c",
      "parents": [
        "de949deb083c43f4e0fed3713617aed768c000aa"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 17 15:21:26 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Sep 18 17:44:06 2020 +0200"
      },
      "message": "Add new command line options using picocli and sanitize code\n\nUsage: koraptokenizer [-hnpsV] [--force] [-ktt] [--[no-]tokens]\n                      [-o\u003d\u003coutput_fillename\u003e] [\u003cinputFiles\u003e...]\nTokenizes (and sentence splits) text input.\n      [\u003cinputFiles\u003e...]   input files\n      --force             Force overwrite (default: false)\n  -h, --help              Show this help message and exit.\n      -ktt                Deprecated. For internal use only. (default: false)\n  -n, --normalize         Normalize tokens (default: false)\n      --[no-]tokens       Print tokens (default: true)\n  -o, --output-file\u003d\u003coutput_fillename\u003e\n                          Output file (default: -)\n  -p, --positions         Print token start and end positions as character\n                            offsets (default: false)\n  -s, --sentence-boundaries\n                          Print sentence boundary positions (default: false)\n  -V, --version           Print version information and exit.\n\nChange-Id: Ib92678c832a2d95799a8f503c3e86dd4da2b4d73\n"
    },
    {
      "commit": "f4df7121d10c9df78288b831a6d397150d140d05",
      "tree": "45b29ed3db785b29cfc25e64c56e666a83c5f3f7",
      "parents": [
        "783e2a27b3e9612cff8348e841c6a484c0d761f9"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 10:23:53 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 10:24:34 2020 +0200"
      },
      "message": "Change jar target naming conventions\n\nWe now have for example:\n\nKorAP-Tokenizer-1.2-783e2a2.jar\nKorAP-Tokenizer-1.2-783e2a2-src.zip\nKorAP-Tokenizer-1.2-783e2a2-standalone.jar\n\nChange-Id: Ie071ff72cf29e388df9996a0755eb60f0ab9a07e\n"
    },
    {
      "commit": "783e2a27b3e9612cff8348e841c6a484c0d761f9",
      "tree": "e2605d396fbfad73b94a2e0c085e509a2360ca4a",
      "parents": [
        "571c194376e9bfc928da5a4eb765e59eceae096d"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 11 23:34:27 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 09:40:25 2020 +0200"
      },
      "message": "Ignore quoted email names like \"John Doe\"@xx.com\n\nThey are rare and are now delivering too many false positives due to Twitter handles, like:\n\n Pluto.\"  Eris-Entdecker Mike Brown, der im Kurznachrichtendienst Twitter unter \"@plutokiller\n\n A different prioritization does not seem necessary either.\n\nChange-Id: I75e328f027f917ab1db246da80201e30604472db\n"
    },
    {
      "commit": "571c194376e9bfc928da5a4eb765e59eceae096d",
      "tree": "ec8d984c8b3b5b1b045315b4591d2954e639133a",
      "parents": [
        "6afd12177bab60924a76c214cacb03029e244c11"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 18:39:57 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Sep 09 08:32:37 2020 +0200"
      },
      "message": "Empty text (\u003cEOT\u003e\u003cEOT\u003e) -\u003e empty output line\n\nEmpty texts, i. e. \u003cEOT\u003e\u003cEOF\u003e will result in empty output lines. At the end of a file however one additional \u003cEOT\u003e will not produce an empty outpu line.\n\nChange-Id: Ib989f91f7172441e6b6d8689dfc118f07d91e1c2\n"
    },
    {
      "commit": "6afd12177bab60924a76c214cacb03029e244c11",
      "tree": "d605c7640a1100490e5c02169921217fb8585b23",
      "parents": [
        "793f85dffdd621f671962eb6e080887d5355a802"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 14:29:11 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 17:51:46 2020 +0200"
      },
      "message": "Use standard EOT/EOF character x04 instead of magic escape \\n\\x03\\n\n\nChange-Id: I06b4eb09064c08b5708a612666b7d807785ae580\n"
    },
    {
      "commit": "793f85dffdd621f671962eb6e080887d5355a802",
      "tree": "baa24b1c4e8075f1b28499431e9c8eb71a800c3f",
      "parents": [
        "b9fb19698cd7703f77d077ca6e23d4aa3ff82062"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 14:40:24 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 17:50:07 2020 +0200"
      },
      "message": "Add first tests for IPC invocation scenario\n\nChange-Id: Ib6b974a5246f22f9c2b1050fd39912e9be2c8fc6\n"
    },
    {
      "commit": "b2666fc5a425f68797079e32c0e3cb6d25d056d7",
      "tree": "bb2764a228d392c2127d92fee69188d1e0e1a2bb",
      "parents": [
        "07d97146420a0909c9d2c21ab21c95069b3a98b1"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 18:03:46 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Sep 08 17:25:08 2020 +0200"
      },
      "message": "Implement sentence splitter\n\nChange-Id: I80969a8ac68193dd2a3dd82c1f606807193c39c8\n"
    },
    {
      "commit": "07d97146420a0909c9d2c21ab21c95069b3a98b1",
      "tree": "a14bb644bb2b3e729ac0a5a1de58b6ba78d6c83f",
      "parents": [
        "c315c2a64a95f9fcf08ae30fef097179bddf7003"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 18:03:34 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 08:23:44 2020 +0200"
      },
      "message": "Move tests to proper location\n\nChange-Id: I447b4777f0d5a616310f102ce71df487245e1c32\n"
    },
    {
      "commit": "81925096b645bf17cf688d1311bce002b5a9418f",
      "tree": "72e8930b1290ff3567cd9987d7e425d9b5e4c580",
      "parents": [
        "478632eb7e133969531f3b401576564783183707"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 15:16:51 2020 +0200"
      },
      "committer": {
        "name": "Marc K",
        "email": "morckx@gmail.com",
        "time": "Mon Sep 07 15:25:28 2020 +0200"
      },
      "message": "Use original Span class and implement Tokenizer interface from OpenNLP\n\nUsing maven assembly plugin to include the required classes into a jar\nfor binary distribution.\n\nThis makes it possible to use KorAPTokenizerImpl as tokenizer in OpenNLP\napplications.\n\nChange-Id: I627dcdd046334db1b1ae9dd60cf7104fd3a3c518\n"
    },
    {
      "commit": "478632eb7e133969531f3b401576564783183707",
      "tree": "750d4b79b2f2b1e4e36794a8d593ebc3cb68b0be",
      "parents": [
        "fe84dd00e4116df5fc7b3bfd026249fe5a8ece5b"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 21:52:54 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 10:59:10 2020 +0200"
      },
      "message": "Clean up code\n\nChange-Id: Icc8d4b091b4f61401d7f4194188b568dd30d627f\n"
    },
    {
      "commit": "45dc0fee5398f28545c8b2f34e0d3c3b894fa0dd",
      "tree": "179fc1f82bc858243c537d369fb338ca76ed82ae",
      "parents": [
        "656055bc573a46cca0ff09db5c498d18740ed7d6"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 21:46:17 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Sep 07 09:11:37 2020 +0200"
      },
      "message": "Add Apache copyright NOTICE\n\nChange-Id: Iaf7b2f7f15ef53d2a55ac3986b9beb236421df7a\n"
    },
    {
      "commit": "3367773b65d4629b0cdc994d134129b00f0f9a63",
      "tree": "86588a5c60e52c837aa8e16090089bbb7da95abe",
      "parents": [],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 04 22:07:39 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 22:07:36 2020 +0200"
      },
      "message": "Initial import from private/Ingestion\n\nChange-Id: I96f428c440ef301384de6d7ef2e348df7d729816\n"
    }
  ]
}
