blob: f5a111da0b0b82042bb87081034713580b9c1d8b [file] [log] [blame]
Nils Diewald2fe12e12015-03-06 16:47:06 +00001package Kalamar;
Nils Diewald5d1ffb42014-05-21 17:45:34 +00002use Mojo::Base 'Mojolicious';
Nils Diewalde2c83812014-11-11 21:13:18 +00003use Mojo::ByteStream 'b';
Akronc7656e92018-08-30 13:33:25 +02004use Mojo::URL;
Akronf65ad6c2017-02-01 14:36:38 +01005use Mojo::File;
Nils Diewalda944fab2015-04-08 21:02:04 +00006use Mojo::JSON 'decode_json';
Akron0c4cd222019-07-19 16:33:34 +02007use Mojo::Util qw/url_escape deprecated slugify/;
Akron4c33c622018-11-12 13:43:27 +01008use List::Util 'none';
Nils Diewald5d1ffb42014-05-21 17:45:34 +00009
Nils Diewald709f52f2015-05-21 18:32:58 +000010# Minor version - may be patched from package.json
Akron337f15d2021-01-14 12:57:21 +010011our $VERSION = '0.41';
Akronc7656e92018-08-30 13:33:25 +020012
13# Supported version of Backend API
14our $API_VERSION = '1.0';
Nils Diewald7cad8402014-07-08 17:06:56 +000015
# TODO: The FAQ-Page has a contact form for new questions
# TODO: Embed query serialization
# TODO: Embed collection statistics
# TODO: Implement tab opener for matches and the tutorial
# TODO: Implement a "projects" system
Nils Diewald7148c6f2015-05-04 15:07:53 +000021
# Start the application and register all routes and plugins.
#
# Invoked with the application object as its only argument. The method
#   - patches $Kalamar::VERSION from package.json (if present),
#   - configures session secrets, cookies and proxy handling,
#   - installs a Content-Security-Policy header on rendered responses,
#   - loads the core plugins and the plugins listed in the configuration,
#   - and establishes the routes for search, documentation, settings,
#     the API proxy and corpus/text/match information.
sub startup {
  my $self = shift;

  # Set version based on package file
  # This may introduce a SemVer patch number
  my $pkg_path = $self->home->child('package.json');
  if (-e $pkg_path->to_abs) {
    my $pkg_version = decode_json($pkg_path->slurp)->{version};

    # Keep the built-in version if package.json declares none,
    # instead of overwriting it with undef
    $Kalamar::VERSION = $pkg_version if defined $pkg_version;
  };

  # Lift maximum template cache
  $self->renderer->cache->max_keys(200);

  # Add additional plugin path
  push(@{$self->plugins->namespaces}, __PACKAGE__ . '::Plugin');

  # Set secrets for signed cookies.
  # The file contains one secret per line (multiple lines allow for
  # secret rotation). The lines are passed as a plain list of strings:
  # wrapping the result of Mojo::ByteStream::split in an array ref
  # would yield a single collection object instead of the secrets.
  my @secrets;
  my $secret_file = $self->home->child('kalamar.secret');
  if (-e $secret_file) {
    @secrets = grep { length } split /\n/, $secret_file->slurp;
  };

  if (@secrets) {
    $self->secrets(\@secrets);
  }

  # File not found (or without any secret) ...
  # Kalamar needs secrets in a file to be easily deployable
  # and publishable at the same time.
  else {
    $self->log->warn('Please create a kalamar.secret file');
  };

  # Configuration framework
  $self->plugin('Config');

  $self->log->info('Mode is ' . $self->mode);

  # Get configuration (and make sure the section exists)
  my $conf = $self->config('Kalamar');
  unless ($conf) {
    $self->config(Kalamar => {});
    $conf = $self->config('Kalamar');
  };

  # Check for API endpoint and set the endpoint accordingly
  if ($conf->{api}) {

    # The api endpoint should be defined as a separated path
    # and version string
    $self->log->warn(
      'Kalamar.api is no longer supported in configurations '.
        'in favor of Kalamar.api_path'
      );
  };

  unless ($conf->{api_path} || $ENV{KALAMAR_API}) {
    $self->log->warn('Kalamar-api_path not defined in configuration');
  };

  $self->sessions->cookie_name('kalamar');

  # Require HTTPS
  if ($conf->{https_only}) {

    # ... for cookie transport
    $self->sessions->secure(1);
  };

  # Run the app from a subdirectory
  if ($conf->{proxy_prefix}) {

    # Scope the session cookie to the prefix and give it a
    # prefix specific name
    my $sessions = $self->sessions;
    $sessions->cookie_path($conf->{proxy_prefix});
    $sessions->cookie_name('kalamar-' . slugify($conf->{proxy_prefix}));

    # Set prefix in stash
    $self->defaults(prefix => $conf->{proxy_prefix});

    # Create base path
    $self->hook(
      before_dispatch => sub {
        shift->req->url->base->path($conf->{proxy_prefix} . '/');
      });
  };

  # Taking the host from the proxy is enabled unless
  # explicitly configured otherwise
  $conf->{proxy_host} //= 1;

  # Take proxy host
  if ($conf->{proxy_host}) {
    $self->hook(
      before_dispatch => sub {
        my $c = shift;
        if (my $host = $c->req->headers->header('X-Forwarded-Host')) {
          my $base = $c->req->url->base;
          $base->host($host);
          $base->scheme(undef);
          $base->port(undef);
        };
      }
    );
  };

  # Content security policy, overridable by configuration
  my $csp = $conf->{cs_policy} // (
    "default-src 'self';".
      "style-src 'self' 'unsafe-inline';".
      "frame-src *;".
      "media-src 'none';".
      "object-src 'self';".
      "font-src 'self';".
      "img-src 'self' data:;"
    );

  $self->hook(
    before_render => sub {
      shift->res->headers->header('Content-Security-Policy' => $csp);
    }
  );

  # API is not yet set - define
  $conf->{api_path} //= $ENV{KALAMAR_API};
  $conf->{api_version} //= $API_VERSION;

  # Add development path
  if ($self->mode eq 'development') {
    push @{$self->static->paths}, 'dev';
  };

  # Set proxy timeouts
  if ($conf->{proxy_inactivity_timeout}) {
    $self->ua->inactivity_timeout($conf->{proxy_inactivity_timeout});
  };
  if ($conf->{proxy_connect_timeout}) {
    $self->ua->connect_timeout($conf->{proxy_connect_timeout});
  };

  # Client notifications
  $self->plugin(Notifications => {
    'Kalamar::Plugin::Notifications' => 1,
    JSON => 1,
    HTML => 1
  });

  # Localization framework
  $self->plugin(Localize => {
    dict => {
      Q => {
        _ => sub { shift->config('Kalamar')->{'examplecorpus'} },
      }
    },
    resources => ['kalamar.dict', 'kalamar.queries.dict']
  });

  # Pagination widget
  $self->plugin('TagHelpers::Pagination' => {
    prev => '<span><span>&lt;</span></span>',
    next => '<span><span>&gt;</span></span>',
    ellipsis => '<a class="ellipsis"><span><span>...</span></span></a>',
    separator => '',
    current => '<span>{current}</span>',
    page => '<span>{page}</span>'
  });

  # Load plugins
  foreach my $plugin (
    'TagHelpers::MailToChiffre', # Obfuscate email addresses
    'KalamarHelpers',            # Specific Helpers for Kalamar
    'KalamarPages',              # Page Helpers for Kalamar
    'KalamarErrors',             # Specific Errors for Kalamar
    'KalamarUser',               # Specific Helpers for Kalamar Users
    'ClientIP',                  # Get client IP from X-Forwarded-For
    'ClosedRedirect',            # Redirect with OpenRedirect protection
    'TagHelpers::ContentBlock',  # Flexible content blocks
  ) {
    $self->plugin($plugin);
  };

  # Enforce the serializer for configured caches as well
  my $serializer = 'JSON';

  if (my $chi = $self->config('CHI')) {
    if ($chi->{default}) {
      $chi->{default}->{serializer} = $serializer;
    };
    if ($chi->{user}) {
      $chi->{user}->{serializer} = $serializer;
    };
  };

  # Global caching mechanism
  $self->plugin('CHI' => {
    default => {
      driver => 'Memory',
      global => 1,
      serializer => $serializer
    },
    user => {
      driver => 'Memory',
      global => 1,
      serializer => $serializer
    }
  });

  # Configure mail exception
  if ($self->config('MailException')) {
    $self->plugin('MailException' => $self->config('MailException'));
  };

  # Load further plugins,
  # that can override core functions,
  # therefore order may be of importance
  if (exists $conf->{'plugins'}) {
    foreach my $plugin (@{$conf->{'plugins'}}) {
      $self->plugin('Kalamar::Plugin::' . $plugin);
    };
  };

  # Deprecated Legacy code
  if ($self->config('Piwik') &&
        none { $_ eq 'Piwik' } @{$conf->{plugins} // []}) {

    # 2018-11-12
    deprecated 'Piwik is no longer considered a mandatory plugin';
    $self->plugin('Kalamar::Plugin::Piwik');
  };

  # Deprecated Legacy code
  if ($self->config('Kalamar')->{auth_support} &&
        none { $_ eq 'Auth' } @{$conf->{plugins} // []}) {

    # 2018-11-16
    deprecated 'auth_support configuration is deprecated in favor of Plugin loading';
    $self->plugin('Kalamar::Plugin::Auth')
  };

  # Configure documentation navigation
  # (an empty navigation file results in an empty navigation)
  my $doc_navi = $self->home->child('templates','doc','navigation.json')->slurp;
  $doc_navi = $doc_navi ? decode_json($doc_navi) : [];

  # TODO:
  #   Use navi->add()
  if ($conf->{navi_ext}) {
    push @$doc_navi, @{$conf->{navi_ext}};
  };

  # TODO:
  #   Remove navi entry
  $self->config(doc_navi => $doc_navi);

  $self->navi->set(doc => $doc_navi);

  $self->log->info('API expected at ' . $self->korap->api);

  # Establish routes with authentification
  my $r = $self->routes;

  # Set footer value
  $self->content_block(footer => {
    inline => '<%= embedded_link_to "doc", "V ' . $Kalamar::VERSION . '", "korap", "kalamar" %>',
    position => 100
  });

  # Base query route
  $r->get('/')->to('search#query')->name('index');

  # Documentation routes
  $r->get('/doc')->to('documentation#page', page => 'korap')->name('doc_start');
  $r->get('/doc/:scope/:page')->to('documentation#page', scope => undef)->name('doc');

  # Settings routes
  if ($self->navi->exists('settings')) {
    $r->get('/settings')->to(
      cb => sub {
        my $c = shift;

        # Keep the settings page out of search indices.
        # 'X-Robots-Tag' is the header evaluated by crawlers;
        # 'X-Robots' is kept for backward compatibility.
        for my $headers ($c->res->headers) {
          $headers->header('X-Robots-Tag' => 'noindex');
          $headers->header('X-Robots' => 'noindex');
        };
        return $c->render('settings');
      }
    )->name('settings_start');
    $r->get('/settings/:scope/:page')->to(
      scope => undef,
      page => undef
    )->name('settings');
  };

  # Contact route
  $r->get('/contact')->to('documentation#contact');
  $r->get('/contact')->mail_to_chiffre('documentation#contact');

  # API proxy route
  $r->any('/api/v#apiv' => [apiv => ['1.0']])->name('proxy')->to('Proxy#pass');
  $r->any('/api/v#apiv/*path' => [apiv => ['1.0']])->to('Proxy#pass');

  # Corpus route
  $r->get('/corpus')->to('search#corpus_info')->name('corpus');

  # Text and match routes share the document prefix
  my $doc = $r->any('/corpus/:corpus_id/:doc_id');
  $doc->get('/:text_id')->to('search#text_info')->name('text');
  $doc->get('/:text_id/:match_id')->to('search#match_info')->name('match');
};
321
322
3231;
324
325
326__END__
Nils Diewalda898dac2015-05-06 21:04:16 +0000327
328=pod
329
Nils Diewaldeb5f3072015-05-20 09:32:42 +0000330=encoding utf8
Nils Diewalda898dac2015-05-06 21:04:16 +0000331
Nils Diewaldeb5f3072015-05-20 09:32:42 +0000332=head1 NAME
333
334Kalamar
Nils Diewalda0defc42015-05-07 23:54:17 +0000335
336
Nils Diewaldeb5f3072015-05-20 09:32:42 +0000337=head1 DESCRIPTION
Nils Diewalda0defc42015-05-07 23:54:17 +0000338
L<Kalamar> is a L<Mojolicious|http://mojolicio.us/> based user interface
frontend for the L<KorAP Corpus Analysis Platform|http://korap.ids-mannheim.de/>.
341
Akron456abd92015-06-02 15:07:21 +0200342B<See the README for further information!>
Nils Diewaldeb5f3072015-05-20 09:32:42 +0000343
Akron456abd92015-06-02 15:07:21 +0200344=head2 COPYRIGHT AND LICENSE
Nils Diewalda748b0e2015-05-19 22:54:06 +0000345
Copyright (C) 2015-2020, L<IDS Mannheim|http://www.ids-mannheim.de/>
Author: L<Nils Diewald|http://nils-diewald.de/>
348
Kalamar is developed as part of the L<KorAP|http://korap.ids-mannheim.de/>
Corpus Analysis Platform at the
L<Leibniz Institute for the German Language (IDS)|http://ids-mannheim.de/>,
member of the
L<Leibniz-Gemeinschaft|http://www.leibniz-gemeinschaft.de>
and supported by the L<KobRA|http://www.kobra.tu-dortmund.de> project,
funded by the
L<Federal Ministry of Education and Research (BMBF)|http://www.bmbf.de/en/>.
357
Kalamar is free software published under the
L<BSD-2 License|https://raw.githubusercontent.com/KorAP/Kalamar/master/LICENSE>.
Nils Diewalda748b0e2015-05-19 22:54:06 +0000360
361=cut