blob: d782ddaf7d5e9e25e84490baaa3009267f60837d [file] [log] [blame]
package Kalamar;
use Mojo::Base 'Mojolicious';
use Mojo::ByteStream 'b';
use Mojo::URL;
use Mojo::File;
use Mojo::JSON qw/decode_json encode_json/;
use Mojo::Util qw/url_escape deprecated slugify/;
use List::Util 'none';

# Minor version - may be patched from package.json
our $VERSION = '0.48';

# Supported version of Backend API
our $API_VERSION = '1.0';

# TODO: The FAQ-Page has a contact form for new questions
# TODO: Embed query serialization
# TODO: Embed collection statistics
# TODO: Implement tab opener for matches and the tutorial
# TODO: Implement a "projects" system

# Start the application and register all routes and plugins.
#
# Invoked with the application object as its only argument.
# The steps are, in order:
#   1. Patch $Kalamar::VERSION from package.json (if that file exists).
#   2. Set the secrets for signed cookies, either from a legacy
#      'kalamar.secret' file or through the AutoSecrets plugin.
#   3. Load the configuration and apply the 'Kalamar' section
#      (HTTPS, proxy prefix, proxy host, API path, timeouts).
#   4. Register all plugins and hooks.
#   5. Establish the routes.
sub startup {
  my $self = shift;

  # Set version based on package file
  # This may introduce a SemVer patch number
  my $pkg_path = $self->home->child('package.json');
  if (-e $pkg_path->to_abs) {
    my $pkg = $pkg_path->slurp;
    $Kalamar::VERSION = decode_json($pkg)->{version};
  };

  # Lift maximum template cache
  $self->renderer->cache->max_keys(200);

  # Add additional plugin path
  push(@{$self->plugins->namespaces}, __PACKAGE__ . '::Plugin');

  # Add additional commands
  push(@{$self->commands->namespaces}, __PACKAGE__ . '::Command');

  # Set secrets for signed cookies
  my $secret_file = $self->home->rel_file('kalamar.secret.json');

  # Support old secrets file
  # This is deprecated 2021-03-05
  if (-e (my $old_secret = $self->home->child('kalamar.secret'))) {

    # Load file and split lines for multiple secrets.
    # The raw string is split directly, so that $secrets is a plain
    # array reference with one string per secret
    # (Mojo::ByteStream::split would return a single
    # Mojo::Collection object instead of a list).
    my $secrets = [split /\n/, $old_secret->slurp];

    $self->secrets($secrets);

    # Only migrate to the new secrets file,
    # if every single secret is short enough
    if (none { length($_) > 22 } @$secrets) {
      eval {

        # Store all secrets as a JSON array
        $secret_file->spurt(encode_json($secrets));
        $secret_file->chmod(0600);
        if (-w $secret_file) {
          $self->log->warn(
            "Please delete $old_secret file " .
              "- $secret_file was created instead"
            );
        }
      };
      if ($@) {
        $self->log->error("Please make $secret_file accessible");
      };
    }

    # At least one secret is too long - keep using the old file
    else {
      $self->log->warn(
        'Unable to automatically switch to Autosecrets, as secret is too long (> 22 chars)'
      );
    };
  }

  # File not found ...
  # Kalamar needs secrets in a file to be easily deployable
  # and publishable at the same time.
  else {
    $self->plugin(AutoSecrets => {
      path => $secret_file
    });
  };

  # Configuration framework
  $self->plugin('Config');

  $self->log->info('Mode is ' . $self->mode);

  # Get configuration
  my $conf = $self->config('Kalamar');
  unless ($conf) {
    $self->config(Kalamar => {});
    $conf = $self->config('Kalamar');
  };

  # Check for API endpoint and set the endpoint accordingly
  if ($conf->{api}) {

    # The api endpoint should be defined as a separated path
    # and version string
    $self->log->warn(
      'Kalamar.api is no longer supported in configurations '.
        'in favor of Kalamar.api_path'
      );
  };

  $self->sessions->cookie_name('kalamar');

  # Require HTTPS
  if ($conf->{https_only}) {

    # ... for cookie transport
    $self->sessions->secure(1);

    # Temporary for session riding
    $self->sessions->samesite('None');

    # For all pages
    $self->hook(
      before_dispatch => sub {
        shift->res->headers->header('Strict-Transport-Security' => 'max-age=3600; includeSubDomains');
      }
    );
  };

  # Run the app from a subdirectory
  if ($conf->{proxy_prefix}) {

    for ($self->sessions) {
      $_->cookie_path($conf->{proxy_prefix});
      $_->cookie_name('kalamar-' . slugify($conf->{proxy_prefix}));
    };

    # Set prefix in stash
    $self->defaults(prefix => $conf->{proxy_prefix});

    # Create base path
    $self->hook(
      before_dispatch => sub {
        shift->req->url->base->path($conf->{proxy_prefix} . '/');
      });
  };

  # Set security related headers for all responses
  $self->hook(
    before_dispatch => sub {
      my $h = shift->res->headers;
      $h->header('X-Content-Type-Options' => 'nosniff');
      $h->header('X-XSS-Protection' => '1; mode=block');

      # Keep an already set value for the allowed methods
      $h->header(
        'Access-Control-Allow-Methods' =>
          $h->header('Access-Control-Allow-Methods') // 'GET, POST, OPTIONS'
        );
    }
  );

  # Taking the proxy host is enabled, unless explicitly configured
  $conf->{proxy_host} //= 1;

  # Take proxy host
  if ($conf->{proxy_host}) {
    $self->hook(
      before_dispatch => sub {
        my $c = shift;
        if (my $host = $c->req->headers->header('X-Forwarded-Host')) {
          foreach ($c->req->url->base) {
            $_->host($host);
            $_->scheme(undef);
            $_->port(undef);
          };
        };
      }
    );
  };

  # API is not yet set - define the default Kustvakt api endpoint
  $conf->{api_path} //= $ENV{KALAMAR_API} || 'https://korap.ids-mannheim.de/api/';
  $conf->{api_version} //= $API_VERSION;

  # Add development path
  if ($self->mode eq 'development') {
    push @{$self->static->paths}, 'dev';
  };

  # Set proxy timeouts
  if ($conf->{proxy_inactivity_timeout}) {
    $self->ua->inactivity_timeout($conf->{proxy_inactivity_timeout});
  };
  if ($conf->{proxy_connect_timeout}) {
    $self->ua->connect_timeout($conf->{proxy_connect_timeout});
  };

  # Client notifications
  $self->plugin(Notifications => {
    'Kalamar::Plugin::Notifications' => 1,
    JSON => 1,
    HTML => 1
  });

  # Establish content security policy
  # This needs to be defined prior to Kalamar::Plugin::Piwik!
  $self->plugin(CSP => {
    'default-src' => 'self',
    'style-src' => ['self','unsafe-inline'],
    # Hash for korap-overview.svg script
    'script-src' => ['self','sha256-VGXK99kFz+zmAQ0kxgleFrBWZgybFAPOl3GQtS7FQkI='],
    'connect-src' => 'self',
    'frame-src' => '*',
    'frame-ancestors' => 'self',
    'media-src' => 'none',
    'object-src' => 'self',
    'font-src' => 'self',
    'img-src' => ['self', 'data:'],
    -with_nonce => 1
  });

  # Localization framework
  $self->plugin(Localize => {
    dict => {
      Q => {
        _ => sub { shift->config('Kalamar')->{'examplecorpus'} },
      }
    },
    resources => ['kalamar.dict', 'kalamar.queries.dict']
  });

  # Pagination widget
  $self->plugin('TagHelpers::Pagination' => {
    prev => '<span><span>&lt;</span></span>',
    next => '<span><span>&gt;</span></span>',
    ellipsis => '<a class="ellipsis inactive"><span><span>...</span></span></a>',
    separator => '',
    current => '<span>{current}</span>',
    page => '<span>{page}</span>'
  });

  # Obfuscate email addresses
  $self->plugin('TagHelpers::MailToChiffre' => {
    method_name => 'PArok',
    pattern_rotate => 673,
    no_inline => 1
  });

  # Load plugins
  foreach (
    'KalamarHelpers',           # Specific Helpers for Kalamar
    'KalamarPages',             # Page Helpers for Kalamar
    'KalamarErrors',            # Specific Errors for Kalamar
    'KalamarUser',              # Specific Helpers for Kalamar Users
    'ClientIP',                 # Get client IP from X-Forwarded-For
    'ClosedRedirect',           # Redirect with OpenRedirect protection
    'TagHelpers::ContentBlock', # Flexible content blocks
  ) {
    $self->plugin($_);
  };

  my $serializer = 'JSON';

  # Enforce the serializer for configured caches
  if (my $chi = $self->config('CHI')) {
    if ($chi->{default}) {
      $chi->{default}->{serializer} = $serializer;
    };
    if ($chi->{user}) {
      $chi->{user}->{serializer} = $serializer;
    };
  };

  # Global caching mechanism
  $self->plugin('CHI' => {
    default => {
      driver => 'Memory',
      global => 1,
      serializer => $serializer
    },
    user => {
      driver => 'Memory',
      global => 1,
      serializer => $serializer
    }
  });

  # Configure mail exception
  if ($self->config('MailException')) {
    $self->plugin('MailException' => $self->config('MailException'));
  };

  # Load further plugins,
  # that can override core functions,
  # therefore order may be of importance
  if (exists $conf->{'plugins'}) {
    foreach (@{$conf->{'plugins'}}) {
      $self->plugin('Kalamar::Plugin::' . $_);
    };
  };

  # Configure documentation navigation
  my $doc_navi = Mojo::File->new($self->home->child('templates','doc','navigation.json'))->slurp;
  $doc_navi = $doc_navi ? decode_json($doc_navi) : [];

  # TODO:
  #   Use navi->add()
  if ($conf->{navi_ext}) {
    push @$doc_navi, @{$conf->{navi_ext}};
  };

  # TODO:
  #   Remove navi entry
  $self->config(doc_navi => $doc_navi);

  $self->navi->set(doc => $doc_navi);

  $self->log->info('API expected at ' . $self->korap->api);

  # Establish routes with authentication
  my $r = $self->routes;

  # Set footer value
  $self->content_block(footer => {
    inline => '<%= embedded_link_to "doc", "V ' . $Kalamar::VERSION . '", "korap", "kalamar" %>',
    position => 100
  });

  # Add nonce script
  $self->content_block(nonce_js => {
    inline => <<'NONCE_JS'
  // Remove the no-js class from the body
  document.body.classList.remove('no-js');
NONCE_JS
  });

  # Base query route
  $r->get('/')->to('search#query')->name('index');

  # Documentation routes
  $r->get('/doc')->to('documentation#page', page => 'ql')->name('doc_start');
  $r->get('/doc/:scope/:page')->to('documentation#page', scope => undef)->name('doc');

  # Settings routes
  if ($self->navi->exists('settings')) {
    $r->get('/settings')->to(
      cb => sub {
        my $c = shift;
        $c->res->headers->header('X-Robots' => 'noindex');
        return $c->render('settings');
      }
    )->name('settings_start');
    $r->get('/settings/:scope/:page')->to(
      scope => undef,
      page => undef
    )->name('settings');
  };

  # Contact route
  $r->get('/contact')->to('documentation#contact');
  $r->get('/contact')->mail_to_chiffre('documentation#contact');

  # API proxy route
  $r->any('/api/v#apiv' => [apiv => ['1.0']])->name('proxy')->to('Proxy#pass');
  $r->any('/api/v#apiv/*api_path' => [apiv => ['1.0']])->to('Proxy#pass');

  # Corpus route
  $r->get('/corpus')->to('search#corpus_info')->name('corpus');

  # Text and match routes share the document path
  my $doc = $r->any('/corpus/:corpus_id/:doc_id');
  $doc->get('/:text_id')->to('search#text_info')->name('text');
  $doc->get('/:text_id/:match_id')->to('search#match_info')->name('match');
};


1;


__END__
Nils Diewalda898dac2015-05-06 21:04:16 +0000378
=pod

=encoding utf8

=head1 NAME

Kalamar


=head1 DESCRIPTION

L<Kalamar> is a L<Mojolicious|http://mojolicio.us/> based user interface
frontend for the L<KorAP Corpus Analysis Platform|https://korap.ids-mannheim.de/>.

B<See the README for further information!>

=head2 COPYRIGHT AND LICENSE

Copyright (C) 2015-2022, L<IDS Mannheim|https://www.ids-mannheim.de/>
Author: L<Nils Diewald|https://www.nils-diewald.de/>

Kalamar is developed as part of the L<KorAP|http://korap.ids-mannheim.de/>
Corpus Analysis Platform at the
L<Leibniz Institute for the German Language (IDS)|https://www.ids-mannheim.de/>,
member of the
L<Leibniz-Gemeinschaft|http://www.leibniz-gemeinschaft.de>
and supported by the L<KobRA|http://www.kobra.tu-dortmund.de> project,
funded by the
L<Federal Ministry of Education and Research (BMBF)|http://www.bmbf.de/en/>.

Kalamar is free software published under the
L<BSD-2 License|https://opensource.org/licenses/BSD-2-Clause>.

=cut