)]}'
{
  "log": [
    {
      "commit": "edee6e5115ef54f850ad0fe7f9a9eb0bf8b3a418",
      "tree": "62047eae3e560d4703174708275bc5e92274b20f",
      "parents": [
        "e19aa3e475243e522b07b823b3eb034ec1d02b59"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Jul 27 14:15:11 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Jul 27 22:31:46 2020 +0200"
      },
      "message": "Make tokenization chainable and remove unnecessary tokenization switch\n\nChange-Id: Iaf47a0fcad225931c941fd7379c02e51a428be07\n"
    },
    {
      "commit": "f57ed81463dceb07312a6a3800c013a16d16c2fa",
      "tree": "a0ce13200c0cf7c6a739491926ce3a20e9c09bb9",
      "parents": [
        "190d02213a60059aa1f5641c86fd89c5265abd00"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Jul 27 10:37:52 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Mon Jul 27 18:24:19 2020 +0200"
      },
      "message": "Establish header object for corpus, doc and text header parsing\n\nChange-Id: I26767fc27054bd3f1b70a622557c0b2f04cac816\n"
    },
    {
      "commit": "190d02213a60059aa1f5641c86fd89c5265abd00",
      "tree": "d92d407cb57797a43cca4788d1402dedbedaf6dd",
      "parents": [
        "994aff7addeadc7be57b848e9d8c50bdafb11bd3"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 25 22:44:33 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sun Jul 26 09:26:20 2020 +0200"
      },
      "message": "Improve utf-8-preprocessing for tokenizers\n\nChange-Id: If18ab6d40b98d372f161a377a0d4efd17444fa69\n"
    },
    {
      "commit": "994aff7addeadc7be57b848e9d8c50bdafb11bd3",
      "tree": "90392a860269ead824f4409bd70475a1488d5b07",
      "parents": [
        "854a11503d3c0e9d22f322c26572d2e032192fc0"
      ],
      "author": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Sat Jul 25 09:53:35 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 25 17:58:27 2020 +0200"
      },
      "message": "faster processing of UTF8-chars\n\nChange-Id: I53ebfbf6a54e319dfeb1569b1ac070278059b0dc\n"
    },
    {
      "commit": "854a11503d3c0e9d22f322c26572d2e032192fc0",
      "tree": "39ea0c4db5401d1097ec1a12ed33d27d217376df",
      "parents": [
        "1d65f9467ab04537821c0d6efd565c49ac3649fb"
      ],
      "author": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Wed Jul 22 22:48:02 2020 +0200"
      },
      "committer": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Fri Jul 24 20:24:20 2020 +0200"
      },
      "message": "bugfixing Conservative.pm\n\n 1. identified wrong tokenization caused by wrong pattern match ($3)\n    (wrote a test in t/tokenization.t, that shows the wrong tokenization)\n\n 2. removed wrong pattern match ($3) and adjusted test in t/tokenization.t\n\n 3. cleaned up (also changed some comments)\n\n 4. fixed missing tokenization of first punctuation char\n\n 5. exchanged [^A-Za-z0-9] by [\\p{Punct}\\s]\n    (TODO: yet no approp. test found)\n\nChange-Id: Ib494c79c3e6971a57ad874fc62583c625095cf28\n"
    },
    {
      "commit": "5fb5e8d0fe8f3b16277a77a68b732dd42a80657b",
      "tree": "4ac1eae081d0179b7dc74d4ea667407c7190cb34",
      "parents": [
        "f9c5124a32e9115155941113bb391402b257bc21"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 23 17:45:13 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Jul 24 07:58:31 2020 +0200"
      },
      "message": "Simplify and centralize temporary file creation\n\nChange-Id: I6674783e7707d66efea05d52381114779f3a64ee\n"
    },
    {
      "commit": "b122717d9a9015ba486eb8503015cfefdb54f1e4",
      "tree": "4dda245d8f2cc516271220a5581aa54dc9f4d522",
      "parents": [
        "4c6ff5b08659b889aeff9cb7ed77eb968d94cab5"
      ],
      "author": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Tue Jul 21 02:12:10 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 21 19:40:11 2020 +0200"
      },
      "message": "clean up intern tokenization\n\n- moved intern tokenization out of retr_info()\n- removed $offset parameter (not anymore necessary)\n\nChange-Id: I063efdee193ab41c2705971a95341573884fd3a2\n"
    },
    {
      "commit": "95bc98aeb0a2e0585d5f8c4a5114ea282d6697d4",
      "tree": "c522f5902098494d55ead0b58c67bd598741642b",
      "parents": [
        "8b511f932a7e0f5d3869525b69006466b82c488d"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 11 12:00:12 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 11 12:00:12 2020 +0200"
      },
      "message": "Rename delHTMLcom to be in line with other naming conventions and make the function exportable\n\nChange-Id: I46d30891b17a5f2bddf7ddc0c492413cc2af6007\n"
    },
    {
      "commit": "8b511f932a7e0f5d3869525b69006466b82c488d",
      "tree": "76ace32ccfecb3239b371e5131c91aadaaf321e0",
      "parents": [
        "d962747a4ac7e02a6040fad736e4a8a45a6b4431"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 09 17:28:08 2020 +0200"
      },
      "committer": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Fri Jul 10 20:52:27 2020 +0200"
      },
      "message": "Establish tokenizer object for external base tokenization\n\nChange-Id: Ie69c280042da5125e0934c87ccaad88b0be5494f\n"
    },
    {
      "commit": "d962747a4ac7e02a6040fad736e4a8a45a6b4431",
      "tree": "9f39e305982ab20660aaa09b669b8accfe00ddba",
      "parents": [
        "95612c3d5a2aeea3d81915b7a846a8dc69d46df4"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 09 16:53:09 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 09 17:01:06 2020 +0200"
      },
      "message": "Establish tokenizer objects for aggressive and conservative base tokenization\n\nChange-Id: I702098185b0b6292c73217268d4516d55a2f95b5\n"
    },
    {
      "commit": "8571751c366b441fc2ce24ce81b13822261b4cc7",
      "tree": "334cec22e96fc3e18cf4c72f5cbc2bf330478a19",
      "parents": [
        "3479082d7eb20d3f120a89344667aa59a335c2b9"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Wed Jul 08 11:19:19 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 09 14:22:02 2020 +0200"
      },
      "message": "Create Zip-Factory for simpler handling of Zip streams\n\nChange-Id: I66fb1e980437f9b931d71b8bc9fde54bda2aee6f\n"
    },
    {
      "commit": "3479082d7eb20d3f120a89344667aa59a335c2b9",
      "tree": "2badaeaee75b583d82ffb82c6b46777317e6c52f",
      "parents": [
        "510a88cfddf2901fac4c9353b8dbfb73d4fb7c64"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 07 15:32:50 2020 +0200"
      },
      "committer": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Thu Jul 09 14:07:25 2020 +0200"
      },
      "message": "Simplify conservative tokenization code\n\nChange-Id: I957c21064ef17691b74de3d57361df62197350ef\n"
    },
    {
      "commit": "510a88cfddf2901fac4c9353b8dbfb73d4fb7c64",
      "tree": "39ff68f8f3fb00a6805b48bab73b19bd2b98d427",
      "parents": [
        "eac374d7e4d87f6d73f67b5658c9084dfead2d12"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 07 10:16:50 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 07 15:31:46 2020 +0200"
      },
      "message": "Minor speedup in tokenization by merging array pushes\n\nChange-Id: I138226acb2648cf606563c57b3783f011bab7795\n"
    },
    {
      "commit": "eac374d7e4d87f6d73f67b5658c9084dfead2d12",
      "tree": "d092ee684de76f63768e8df3af20aa13510a5a26",
      "parents": [
        "7fab93bf003e4737d0b9b260e73948eac1368add"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 07 09:00:44 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Tue Jul 07 09:43:11 2020 +0200"
      },
      "message": "Separate dummy tokenization from main script with minimal changes\n\nChange-Id: I74ca0a47ad897ef639c90f8af564d08dd5050c63\n"
    },
    {
      "commit": "7fab93bf003e4737d0b9b260e73948eac1368add",
      "tree": "bd2d03a4d8f27413b7663707f2fc105d09271bb2",
      "parents": [
        "2d547bcc6c9af8a65973dae1bc804b08445abaf1"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 04 11:14:21 2020 +0200"
      },
      "committer": {
        "name": "Peter Harders",
        "email": "harders@ids-mannheim.de",
        "time": "Mon Jul 06 10:59:36 2020 +0200"
      },
      "message": "Replace recursion and non-essential regexes with index/substr\n(as a very minor performance improvement) and fix a bug\nwhere a single-line regex would ignore the newline symbol.\n\nChange-Id: I573b50b85b7dd2732c2cad3f50e22b0e9e33e2ea\n"
    },
    {
      "commit": "2d547bcc6c9af8a65973dae1bc804b08445abaf1",
      "tree": "cdb6346a80432894224a5e420ac174afda8e70ff",
      "parents": [
        "5ca6efc5fee7874b599841685f03c723a5fe6d32"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Sat Jul 04 10:34:35 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "diewald@ids-mannheim.de",
        "time": "Sat Jul 04 11:58:23 2020 +0200"
      },
      "message": "Fix a bug in delHTMLcom where comments were left open\n\nChange-Id: I424ac394fa7eaad9a2b62c61761d2de6720870a2\n"
    },
    {
      "commit": "4f67cd4981c4b3c960104f2d7bd04e7ce8c084be",
      "tree": "d4c442cac73184b60a0086922ff4cbafa82cc7d8",
      "parents": [
        "9015734b7bd4b0db912e97f4ea8df8139f802c77"
      ],
      "author": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Thu Jul 02 12:27:58 2020 +0200"
      },
      "committer": {
        "name": "Akron",
        "email": "nils@diewald-online.de",
        "time": "Fri Jul 03 15:29:31 2020 +0200"
      },
      "message": "Atomize and test comment stripping\n\nChange-Id: Id798c8bac96214f29659b2764f8861539d6f5210\n"
    }
  ]
}
