)]}'
{
  "log": [
    {
      "commit": "e3282b0936a96957a69abb4d94cc7d36ad1d03fa",
      "tree": "758d3854a701453ea6ca40d6e18d15df296dd529",
      "parents": [
        "4fb896a5bc95fcd2eb02a6d63ef8d471ca801431"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Oct 13 10:29:23 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:40:27 2020 +0200"
      },
      "message": "Accept URLs starting with \"www.\" without URI scheme\n\nChange-Id: I5b46b93984f1192ed0b67ddc1fa05051aae16405\n"
    },
    {
      "commit": "4fb896a5bc95fcd2eb02a6d63ef8d471ca801431",
      "tree": "51a78963308b1d7e0d9936cb984535d281d638bf",
      "parents": [
        "f5a7e04885f2149f41323b9abfedd3efec10dfe1"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 17:51:48 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:40:24 2020 +0200"
      },
      "message": "Amend English abbreviation macro\n\n... based on English Wikipedia articles and talk pages\n\nChange-Id: Ia074e125527e89c53423e3c395d872bb5861cabd\n"
    },
    {
      "commit": "f5a7e04885f2149f41323b9abfedd3efec10dfe1",
      "tree": "846699be050458ff833140b3d706682e500ef4e7",
      "parents": [
        "74141b3d2dc0a77833e028370e7e0ff71a4251ad"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:43:24 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Oct 14 14:34:53 2020 +0200"
      },
      "message": "Add French tokenizer (-l fr)\n\nBased on French Wikipedia articles and talk pages\n\nChange-Id: I3ee72d7d73e567638b6882a101baaf3b5ffee258\n"
    },
    {
      "commit": "74141b3d2dc0a77833e028370e7e0ff71a4251ad",
      "tree": "418c4de433b8617e1bb61bf95169493c3ef745bb",
      "parents": [
        "5c6df037afcdc7a149f84d9db50c6c88a5b278db"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 01 23:23:18 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:14:58 2020 +0200"
      },
      "message": "Add -l command line option to choose language\n\nChange-Id: I48e1ce119dfbd75ff9f719ce8525a2c63ad47fc5\n"
    },
    {
      "commit": "5c6df037afcdc7a149f84d9db50c6c88a5b278db",
      "tree": "f2a35d8226b827a88135d14a6943e1f5f950618e",
      "parents": [
        "ce48102c8ed132cb97dd89f90c3ecd38009e4a71"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 29 22:19:38 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Oct 12 10:10:07 2020 +0200"
      },
      "message": "List available KorapTokenizerImplementation options for -T\n\nChange-Id: I8e45410f67decb6b44fc9574dfe94c89b7abd0cc\n"
    },
    {
      "commit": "ce48102c8ed132cb97dd89f90c3ecd38009e4a71",
      "tree": "652465801ff4ace03ffe27372170186efc31f29e",
      "parents": [
        "67eed1c2ffa2a4b61958071d61f4f84d9bd10861"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Oct 11 12:08:16 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sun Oct 11 12:08:16 2020 +0200"
      },
      "message": "Recognize {LETTER}+str. as abbreviation for Straße in de-tokenizer\n\nChange-Id: If4bdc02994e2a4ee48051f5047f78d2dddeb10c5\n"
    },
    {
      "commit": "67eed1c2ffa2a4b61958071d61f4f84d9bd10861",
      "tree": "ae3a7c8042c9eaaf534909b99ad46d10bfde1e1f",
      "parents": [
        "8e197f3c8895ff5d66d903f17da7e915076c84c8"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 28 21:37:16 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Oct 09 14:48:55 2020 +0200"
      },
      "message": "Build language specific tokenizers: de, en\n\nChange-Id: Iedad4d96aa702e173ed98d888685b4dd7b113cd5\n"
    },
    {
      "commit": "8e197f3c8895ff5d66d903f17da7e915076c84c8",
      "tree": "a0d68069e2c9cc3e9f26f2d23fbd88c501b13063",
      "parents": [
        "ad22e2ce7f253650d96373bb1fd6472f091075a9"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 09:20:37 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 18:06:46 2020 +0200"
      },
      "message": "Allow setting input encoding explicitely whith -e \u003cencoding\u003e\n\nAnd use UTF-8 as default.\n\nOtherwise tests fail if no UTF-8 locale is set.\n\nChange-Id: Ie2b8ef2009a037b767b95710e84266af75381fb9\n"
    },
    {
      "commit": "37018068f9423b8f229257c9b0c30fe1e64e66d8",
      "tree": "55fea5da9d678375c67cdf09c779fddab77e05f9",
      "parents": [
        "751868b9a6f8c65ae26bd212c746c91e80d00d7c"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 17:54:59 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Oct 08 17:55:34 2020 +0200"
      },
      "message": "Do not use commit ids for naming standalone jars\n\nChange-Id: I713ea18c9c9db796bc74e90c7bc5b83885a4b805\n"
    },
    {
      "commit": "751868b9a6f8c65ae26bd212c746c91e80d00d7c",
      "tree": "efa93123637391ce7b6718a269495f9677717a64",
      "parents": [
        "b9f45e084ceca956b3378fe12d20d9d5b08edadc"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 25 17:59:38 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 28 09:04:10 2020 +0200"
      },
      "message": "Make tokenizer implementation exchangeable\n\nAllows for quite an easy adaptation and integration of other language\nspecializations and other tokenizers, also from the command line with\nnew -T option that allows to specify the tokenizer class name.\n\nTODO: add documentation to the KorapTokenizer interface\n\nChange-Id: Ib95793f47887a3b0829d68ebdbf8bc40815a0605\n"
    },
    {
      "commit": "b9f45e084ceca956b3378fe12d20d9d5b08edadc",
      "tree": "c600f3a8d842f7ee6607080840ea0701de57085c",
      "parents": [
        "c419d5b22c508a352f00fb11f23034a10bfbaf3d"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 17 20:03:59 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 18 19:13:17 2020 +0200"
      },
      "message": "Rename tokenizer class to KorAPDFATokenizer\n\nChange-Id: Icad8af7582689f599eda27258cc397e6155aeefe\n"
    },
    {
      "commit": "c419d5b22c508a352f00fb11f23034a10bfbaf3d",
      "tree": "83eb21aa0d47920a7c1fcd225601249c1dc4108c",
      "parents": [
        "de949deb083c43f4e0fed3713617aed768c000aa"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Thu Sep 17 15:21:26 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Sep 18 17:44:06 2020 +0200"
      },
      "message": "Add new command line options using picocli and sanitize code\n\nUsage: koraptokenizer [-hnpsV] [--force] [-ktt] [--[no-]tokens]\n                      [-o\u003d\u003coutput_fillename\u003e] [\u003cinputFiles\u003e...]\nTokenizes (and sentence splits) text input.\n      [\u003cinputFiles\u003e...]   input files\n      --force             Force overwrite (default: false)\n  -h, --help              Show this help message and exit.\n      -ktt                Deprecated. For internal use only. (default: false)\n  -n, --normalize         Normalize tokens (default: false)\n      --[no-]tokens       Print tokens (default: true)\n  -o, --output-file\u003d\u003coutput_fillename\u003e\n                          Output file (default: -)\n  -p, --positions         Print token start and end positions as character\n                            offsets (default: false)\n  -s, --sentence-boundaries\n                          Print sentence boundary positions (default: false)\n  -V, --version           Print version information and exit.\n\nChange-Id: Ib92678c832a2d95799a8f503c3e86dd4da2b4d73\n"
    },
    {
      "commit": "f4df7121d10c9df78288b831a6d397150d140d05",
      "tree": "45b29ed3db785b29cfc25e64c56e666a83c5f3f7",
      "parents": [
        "783e2a27b3e9612cff8348e841c6a484c0d761f9"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 10:23:53 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 10:24:34 2020 +0200"
      },
      "message": "Change jar target naming conventions\n\nWe now have for example:\n\nKorAP-Tokenizer-1.2-783e2a2.jar\nKorAP-Tokenizer-1.2-783e2a2-src.zip\nKorAP-Tokenizer-1.2-783e2a2-standalone.jar\n\nChange-Id: Ie071ff72cf29e388df9996a0755eb60f0ab9a07e\n"
    },
    {
      "commit": "783e2a27b3e9612cff8348e841c6a484c0d761f9",
      "tree": "e2605d396fbfad73b94a2e0c085e509a2360ca4a",
      "parents": [
        "571c194376e9bfc928da5a4eb765e59eceae096d"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 11 23:34:27 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 14 09:40:25 2020 +0200"
      },
      "message": "Ignore quoted email names like \"John Doe\"@xx.com\n\nThey are rare and are now delivering too many false positives due to Twitter handles, like:\n\n Pluto.\"  Eris-Entdecker Mike Brown, der im Kurznachrichtendienst Twitter unter \"@plutokiller\n\n A different prioritization does not seem necessary either.\n\nChange-Id: I75e328f027f917ab1db246da80201e30604472db\n"
    },
    {
      "commit": "571c194376e9bfc928da5a4eb765e59eceae096d",
      "tree": "ec8d984c8b3b5b1b045315b4591d2954e639133a",
      "parents": [
        "6afd12177bab60924a76c214cacb03029e244c11"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 18:39:57 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Wed Sep 09 08:32:37 2020 +0200"
      },
      "message": "Empty text (\u003cEOT\u003e\u003cEOT\u003e) -\u003e empty output line\n\nEmpty texts, i. e. \u003cEOT\u003e\u003cEOF\u003e will result in empty output lines. At the end of a file however one additional \u003cEOT\u003e will not produce an empty outpu line.\n\nChange-Id: Ib989f91f7172441e6b6d8689dfc118f07d91e1c2\n"
    },
    {
      "commit": "6afd12177bab60924a76c214cacb03029e244c11",
      "tree": "d605c7640a1100490e5c02169921217fb8585b23",
      "parents": [
        "793f85dffdd621f671962eb6e080887d5355a802"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 14:29:11 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 17:51:46 2020 +0200"
      },
      "message": "Use standard EOT/EOF character x04 instead of magic escape \\n\\x03\\n\n\nChange-Id: I06b4eb09064c08b5708a612666b7d807785ae580\n"
    },
    {
      "commit": "793f85dffdd621f671962eb6e080887d5355a802",
      "tree": "baa24b1c4e8075f1b28499431e9c8eb71a800c3f",
      "parents": [
        "b9fb19698cd7703f77d077ca6e23d4aa3ff82062"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 14:40:24 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 17:50:07 2020 +0200"
      },
      "message": "Add first tests for IPC invocation scenario\n\nChange-Id: Ib6b974a5246f22f9c2b1050fd39912e9be2c8fc6\n"
    },
    {
      "commit": "b2666fc5a425f68797079e32c0e3cb6d25d056d7",
      "tree": "bb2764a228d392c2127d92fee69188d1e0e1a2bb",
      "parents": [
        "07d97146420a0909c9d2c21ab21c95069b3a98b1"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 18:03:46 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Sep 08 17:25:08 2020 +0200"
      },
      "message": "Implement sentence splitter\n\nChange-Id: I80969a8ac68193dd2a3dd82c1f606807193c39c8\n"
    },
    {
      "commit": "07d97146420a0909c9d2c21ab21c95069b3a98b1",
      "tree": "a14bb644bb2b3e729ac0a5a1de58b6ba78d6c83f",
      "parents": [
        "c315c2a64a95f9fcf08ae30fef097179bddf7003"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 18:03:34 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Tue Sep 08 08:23:44 2020 +0200"
      },
      "message": "Move tests to proper location\n\nChange-Id: I447b4777f0d5a616310f102ce71df487245e1c32\n"
    },
    {
      "commit": "81925096b645bf17cf688d1311bce002b5a9418f",
      "tree": "72e8930b1290ff3567cd9987d7e425d9b5e4c580",
      "parents": [
        "478632eb7e133969531f3b401576564783183707"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 15:16:51 2020 +0200"
      },
      "committer": {
        "name": "Marc K",
        "email": "morckx@gmail.com",
        "time": "Mon Sep 07 15:25:28 2020 +0200"
      },
      "message": "Use original Span class and implement Tokenizer interface from OpenNLP\n\nUsing maven assembly plugin to include the required classes into a jar\nfor binary distribution.\n\nThis makes it possible to use KorAPTokenizerImpl as tokenizer in OpenNLP\napplications.\n\nChange-Id: I627dcdd046334db1b1ae9dd60cf7104fd3a3c518\n"
    },
    {
      "commit": "478632eb7e133969531f3b401576564783183707",
      "tree": "750d4b79b2f2b1e4e36794a8d593ebc3cb68b0be",
      "parents": [
        "fe84dd00e4116df5fc7b3bfd026249fe5a8ece5b"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 21:52:54 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Mon Sep 07 10:59:10 2020 +0200"
      },
      "message": "Clean up code\n\nChange-Id: Icc8d4b091b4f61401d7f4194188b568dd30d627f\n"
    },
    {
      "commit": "45dc0fee5398f28545c8b2f34e0d3c3b894fa0dd",
      "tree": "179fc1f82bc858243c537d369fb338ca76ed82ae",
      "parents": [
        "656055bc573a46cca0ff09db5c498d18740ed7d6"
      ],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 21:46:17 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Sep 07 09:11:37 2020 +0200"
      },
      "message": "Add Apache copyright NOTICE\n\nChange-Id: Iaf7b2f7f15ef53d2a55ac3986b9beb236421df7a\n"
    },
    {
      "commit": "3367773b65d4629b0cdc994d134129b00f0f9a63",
      "tree": "86588a5c60e52c837aa8e16090089bbb7da95abe",
      "parents": [],
      "author": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Fri Sep 04 22:07:39 2020 +0200"
      },
      "committer": {
        "name": "Marc Kupietz",
        "email": "kupietz@ids-mannheim.de",
        "time": "Sat Sep 05 22:07:36 2020 +0200"
      },
      "message": "Initial import from private/Ingestion\n\nChange-Id: I96f428c440ef301384de6d7ef2e348df7d729816\n"
    }
  ]
}
