| Nils Diewald | d37f7e4 | 2015-02-27 21:08:22 +0000 | [diff] [blame] | 1 | # Krill Backend properties |
| 2 | krill.properties = true |
| 3 | krill.indexDir = [PATH TO INDEX DIRECTORY] |
| 4 | krill.server.name = [UNIQUE NODE NAME] |
| 5 | krill.server.baseURI = [LISTEN-URL INCLUDING PORT] |
| 6 | |
| 7 | # Krill Database properties |
| 8 | krill.db.class = org.mariadb.jdbc.Driver |
| 9 | krill.db.URL = jdbc:mysql://[DB_IP]:[DB_PORT]/[DB_NAME] |
| 10 | krill.db.pwd = [DB_PWD] |
| 11 | krill.db.user = [DB_USER] |
| 12 | |
| 13 | krill.index.commit.count = 134217000 |
| 14 | krill.index.commit.log = log/krill.commit.log |
| 15 | krill.index.commit.auto = 500 |
| 16 | krill.index.relations.max = 100 |
| Marc Kupietz | 3f29812 | 2025-04-17 08:25:05 +0200 | [diff] [blame] | 17 | krill.index.textSize.max = 20000000 |
| Akron | e6958aa | 2025-09-26 11:02:01 +0200 | [diff] [blame] | 18 | |
| 19 | # Token retrieval settings: |
| 20 | # |
| 21 | # krill.match.max.token = 50 |
| 22 | # |
| Akron | 88c66a9 | 2026-05-07 12:11:21 +0200 | [diff] [blame^] | 23 | ## Maximum number (i.e. length) of tokens to be retrievable in a match. |
| Akron | e6958aa | 2025-09-26 11:02:01 +0200 | [diff] [blame] | 24 | ## Matches longer than that will be cut. |
| 25 | ## Defaults to 50 |
| 26 | |
| 27 | # krill.context.max.token = |
| 28 | # |
| 29 | ## Maximum number (i.e. length) of tokens to be retrieved on each side (left and right) of a match. |
| 30 | ## Defaults to 60 |
| 31 | |
| 32 | # krill.kwic.max.token = |
| 33 | # |
| 34 | ## Maximum total number of tokens in a KWIC snippet (left + match + right). |
| 35 | ## When set, this derives krill.context.left.maxShrink and |
| 36 | ## krill.context.right.maxShrink automatically: |
| 37 | ## totalShrink = (krill.match.max.token + 2 * krill.context.max.token) - krill.kwic.max.token |
| 38 | ## Split evenly between left and right. |
| 39 | ## When this property is set, individual maxShrink values are ignored. |
| 40 | ## The existing krill.match.max.token remains in effect as a separate cap |
| 41 | ## on match length, preventing data leakage from sentence-level queries. |
| 42 | ## Not set by default (no KWIC cap - backward compatible). |
| 43 | |
| 44 | # krill.context.left.maxShrink = 0 |
| 45 | # |
| 46 | ## Maximum number of tokens the left context may shrink based on match length. |
| 47 | ## Defaults to 0 (no shrinking - full context is always returned). |
| 48 | ## When a match is long, the context shrinks by up to this many tokens, |
| 49 | ## keeping the total KWIC width manageable. |
| 50 | ## The total shrink is distributed proportionally between left and right |
| 51 | ## according to their respective maxShrink values. |
| 52 | ## Use the string "max" to allow the context to shrink entirely |
| 53 | ## (up to krill.context.max.token tokens). |
| 54 | ## Ignored when krill.kwic.max.token is set. |
| 55 | ## Note: Only token-based contexts are affected; character-based contexts |
| 56 | ## are currently not adjusted by this feature. |
| 57 | |
| 58 | # krill.context.right.maxShrink = 0 |
| 59 | # |
| 60 | ## Maximum number of tokens the right context may shrink based on match length. |
| 61 | ## Defaults to 0 (no shrinking - full context is always returned). |
| 62 | ## When a match is long, the context shrinks by up to this many tokens, |
| 63 | ## keeping the total KWIC width manageable. |
| 64 | ## The total shrink is distributed proportionally between left and right |
| 65 | ## according to their respective maxShrink values. |
| 66 | ## Use the string "max" to allow the context to shrink entirely |
| 67 | ## (up to krill.context.max.token tokens). |
| 68 | ## Ignored when krill.kwic.max.token is set. |
| 69 | ## Note: Only token-based contexts are affected; character-based contexts |
| 70 | ## are currently not adjusted by this feature. |
| 71 | |
| Akron | 88c66a9 | 2026-05-07 12:11:21 +0200 | [diff] [blame^] | 72 | # krill.context.max.char = |
| 73 | # |
| 74 | ## Maximum number of characters to be retrieved to the left and right of a match |
| 75 | ## when the client requests character-based context. |
| 76 | ## Character-based contexts are independent of token-based contexts: |
| 77 | ## the client chooses one or the other per request. When character context |
| 78 | ## is used, token-based maxShrink adjustment does NOT apply. |
| 79 | ## Defaults to 500 |