| Akron | 0a0e924 | 2016-10-28 14:42:29 +0200 | [diff] [blame] | 1 | package Krawfish::Koral::Query; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 2 | use Role::Tiny::With; |
| 3 | with 'Krawfish::Koral::Info'; |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 4 | # TODO: Use the same parent as Koral::Corpus |
| Akron | 4763ea6 | 2016-11-02 19:36:18 +0100 | [diff] [blame] | 5 | use Krawfish::Koral::Query::Builder; |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 6 | use Krawfish::Koral::Query::Importer; |
| Akron | 6ce5108 | 2017-07-26 17:31:41 +0200 | [diff] [blame] | 7 | use Krawfish::Log; |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 8 | use Mojo::Util qw/md5_sum/; |
| Akron | 0a0e924 | 2016-10-28 14:42:29 +0200 | [diff] [blame] | 9 | use warnings; |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 10 | use strict; |
| Akron | 0a0e924 | 2016-10-28 14:42:29 +0200 | [diff] [blame] | 11 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 12 | # Base class for span queries |
| 13 | |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 14 | # TODO: |
| Akron | 8231ca7 | 2017-06-16 16:08:32 +0200 | [diff] [blame] | 15 | # - extended_* may be queried |
| 16 | # automatically without parameter |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 17 | # - rename all sorts of single ops to operand |
| 18 | # - rename all sorts of multiple ops to operands |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 19 | |
| Akron | 818e852 | 2017-07-22 12:34:01 +0200 | [diff] [blame] | 20 | # TODO: |
| 21 | # This is now double with Krawfish::Koral! |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 22 | |
| Akron | 818e852 | 2017-07-22 12:34:01 +0200 | [diff] [blame] | 23 | use constant { |
| Akron | 6ce5108 | 2017-07-26 17:31:41 +0200 | [diff] [blame] | 24 | CONTEXT => 'http://korap.ids-mannheim.de/ns/koral/0.6/context.jsonld', |
| 25 | DEBUG => 0 |
| Akron | 818e852 | 2017-07-22 12:34:01 +0200 | [diff] [blame] | 26 | }; |
| 27 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 28 | |
| 29 | # Constructor |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 30 | sub new { |
| 31 | my $class = shift; |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 32 | my $self = bless { |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 33 | anywhere => 0, |
| Akron | 4763ea6 | 2016-11-02 19:36:18 +0100 | [diff] [blame] | 34 | optional => 0, |
| 35 | null => 0, |
| 36 | negative => 0, |
| 37 | extended => 0, |
| Akron | ddf077a | 2016-11-05 15:00:00 +0100 | [diff] [blame] | 38 | extended_left => 0, |
| Akron | 6621e11 | 2016-11-05 17:21:39 +0100 | [diff] [blame] | 39 | extended_right => 0 |
| Akron | 4763ea6 | 2016-11-02 19:36:18 +0100 | [diff] [blame] | 40 | }, $class; |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 41 | |
| 42 | if ($_[0]) { |
| 43 | return $self->from_koral(shift); |
| 44 | }; |
| 45 | |
| 46 | $self; |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 47 | }; |
| 48 | |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 49 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 50 | # Override type |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 51 | sub type { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 52 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 53 | }; |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 54 | |
| 55 | |
| Akron | 4763ea6 | 2016-11-02 19:36:18 +0100 | [diff] [blame] | 56 | ######################################### |
| 57 | # Query Planning methods and attributes # |
| 58 | ######################################### |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 59 | |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 60 | |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 61 | # Normalize the query |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 62 | sub normalize { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 63 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 64 | }; |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 65 | |
| 66 | |
| 67 | # Refer to common subqueries |
| 68 | sub refer { |
| 69 | $_[0]; |
| 70 | }; |
| 71 | |
| 72 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 73 | # Translate to ids |
| Akron | 7dc2a64 | 2017-08-02 15:39:49 +0200 | [diff] [blame] | 74 | # TODO: |
| Akron | 5a5595b | 2017-09-10 13:00:57 +0200 | [diff] [blame] | 75 | # If "nowhere" returns, optimize away |
| Akron | 7dc2a64 | 2017-08-02 15:39:49 +0200 | [diff] [blame] | 76 | # before ->optimize(). |
| 77 | sub identify { |
| 78 | my ($self, $dict) = @_; |
| 79 | |
| 80 | my $ops = $self->operands; |
| 81 | return $self unless $ops; |
| 82 | for (my $i = 0; $i < @$ops; $i++) { |
| 83 | $ops->[$i] = $ops->[$i]->identify($dict); |
| 84 | }; |
| 85 | return $self; |
| 86 | }; |
| 87 | |
| 88 | |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 89 | # Check for cached subqueries |
| 90 | sub cache { |
| 91 | $_[0]; |
| 92 | }; |
| 93 | |
| 94 | |
| 95 | # Optimize for an index |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 96 | sub optimize { |
| 97 | ... |
| 98 | }; |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 99 | |
| 100 | |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 101 | # This is the class to be overwritten |
| 102 | # by subclasses |
| 103 | sub _finalize { |
| 104 | $_[0]; |
| 105 | }; |
| 106 | |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 107 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 108 | # Treat the operand like a root operand |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 109 | sub finalize { |
| 110 | my $self = shift; |
| 111 | |
| Akron | 6ce5108 | 2017-07-26 17:31:41 +0200 | [diff] [blame] | 112 | if (DEBUG) { |
| 113 | print_log('kq_query', 'Finalize query ' . $self->to_string); |
| 114 | }; |
| 115 | |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 116 | my $query = $self; |
| 117 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 118 | # The query matches everywhere |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 119 | if ($query->is_anywhere || $query->is_null) { |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 120 | $self->error(780, "This query matches everywhere"); |
| 121 | return; |
| 122 | }; |
| 123 | |
| Akron | 6ce5108 | 2017-07-26 17:31:41 +0200 | [diff] [blame] | 124 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 125 | # The query matches nowhere |
| Akron | 5a5595b | 2017-09-10 13:00:57 +0200 | [diff] [blame] | 126 | if ($query->is_nowhere) { |
| 127 | return $query->builder->nowhere; |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 128 | }; |
| 129 | |
| 130 | if ($query->is_negative) { |
| Akron | c4bf5fb | 2017-07-18 02:20:40 +0200 | [diff] [blame] | 131 | $query->warning(782, 'Exclusivity of query is ignored'); |
| Akron | 5ddc38f | 2017-07-18 00:16:22 +0200 | [diff] [blame] | 132 | # TODO: |
| 133 | # Better not search at all, because in case the query was classed, |
| 134 | # this class information would be lost in the normalization process, so |
| 135 | # {1:[!der]} would become [der], which is somehow weird. |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 136 | $query->is_negative(0); |
| 137 | }; |
| 138 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 139 | # Ignore optionality |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 140 | if ($query->is_optional) { |
| Akron | c4bf5fb | 2017-07-18 02:20:40 +0200 | [diff] [blame] | 141 | $query->warning(781, "Optionality of query is ignored"); |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 142 | $query->is_optional(0); |
| 143 | }; |
| 144 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 145 | # Use a finalize method |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 146 | $query = $query->_finalize; |
| 147 | |
| Akron | 5ddc38f | 2017-07-18 00:16:22 +0200 | [diff] [blame] | 148 | # TODO: |
| 149 | # This needs to be in the finalize stage |
| 150 | # on the segment level! |
| 151 | |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 152 | # There is a possible 'anywhere' extension, |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 153 | # that may exceed the text boundary |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 154 | if ($query->is_extended_right) { |
| 155 | return $self->builder->in_text($query); |
| 156 | }; |
| 157 | |
| 158 | # Return the planned query |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 159 | # TODO: |
| 160 | # Check for serialization errors |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 161 | return $query; |
| 162 | }; |
| 163 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 164 | |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 165 | # Returns a list of classes used by the query, |
| 166 | # e.g. in a focus() context. |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 167 | sub uses_classes { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 168 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 169 | }; |
| Akron | 55fb308 | 2017-07-18 13:24:53 +0200 | [diff] [blame] | 170 | |
| Akron | 6b19563 | 2017-06-09 23:47:49 +0200 | [diff] [blame] | 171 | |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 172 | sub remove_unused_classes { |
| 173 | my ($self, $classes) = @_; |
| 174 | my $used = $self->uses_classes; |
| 175 | # Pass classes required for highlighting or grouping, |
| 176 | # and take classes from uses_classes() into account. |
| 177 | # This is not done recursively, as it first needs to |
| 178 | # gather all classes and then can remove them. |
| 179 | }; |
| 180 | |
| 181 | |
| Akron | 5ddc38f | 2017-07-18 00:16:22 +0200 | [diff] [blame] | 182 | # Remove classes passed as an array references |
| 183 | sub remove_classes { |
| 184 | my ($self, $keep) = @_; |
| 185 | unless ($keep) { |
| 186 | $keep = []; |
| 187 | }; |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 188 | my $ops = $self->operands; |
| Akron | 4f9eef4 | 2017-07-24 11:41:09 +0200 | [diff] [blame] | 189 | |
| 190 | return $self unless $ops; |
| 191 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 192 | for (my $i = 0; $i < @$ops; $i++) { |
| 193 | $ops->[$i] = $ops->[$i]->remove_classes($keep); |
| 194 | }; |
| Akron | 5ddc38f | 2017-07-18 00:16:22 +0200 | [diff] [blame] | 195 | return $self; |
| 196 | }; |
| 197 | |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 198 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 199 | # Get and set operands |
| 200 | sub operands { |
| 201 | my $self = shift; |
| 202 | if (@_) { |
| Akron | a84ef2d | 2017-08-07 14:45:46 +0200 | [diff] [blame] | 203 | my $ops = shift; |
| 204 | my @new_ops = (); |
| 205 | foreach my $op (@$ops) { |
| 206 | $self->remove_info_from($op); |
| 207 | push @new_ops, $op; |
| 208 | }; |
| 209 | $self->{operands} = \@new_ops; |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 210 | }; |
| 211 | $self->{operands}; |
| 212 | }; |
| 213 | |
| 214 | |
| 215 | # Get and set first and only operand |
| 216 | sub operand { |
| 217 | if (@_ == 2) { |
| 218 | $_[0]->{operands} = [$_[1]]; |
| 219 | }; |
| 220 | $_[0]->{operands}->[0]; |
| 221 | }; |
| 222 | |
| 223 | |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 224 | # Matches everything |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 225 | sub is_anywhere { |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 226 | my $self = shift; |
| 227 | if (defined $_[0]) { |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 228 | $self->{anywhere} = shift; |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 229 | }; |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 230 | return $self->{anywhere} // 0; |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 231 | }; |
| 232 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 233 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 234 | # Is optional |
| 235 | sub is_optional { |
| Akron | c552937 | 2017-06-21 15:56:18 +0200 | [diff] [blame] | 236 | my $self = shift; |
| 237 | if (defined $_[0]) { |
| 238 | $self->{optional} = shift; |
| 239 | }; |
| 240 | return $self->{optional} // 0; |
| 241 | }; |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 242 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 243 | |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 244 | # Null is empty - e.g. in |
| Akron | c048b18 | 2017-06-13 01:29:03 +0200 | [diff] [blame] | 245 | # Der >alte{0}< Mann |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 246 | sub is_null { |
| 247 | $_[0]->{null} // 0 |
| 248 | }; |
| 249 | |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 250 | |
| 251 | # Nothing matches nowhere - e.g. in |
| 252 | # Der [alte & !alte] Mann |
| Akron | 5a5595b | 2017-09-10 13:00:57 +0200 | [diff] [blame] | 253 | sub is_nowhere { |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 254 | my $self = shift; |
| 255 | if (defined $_[0]) { |
| Akron | 5a5595b | 2017-09-10 13:00:57 +0200 | [diff] [blame] | 256 | $self->{nowhere} = shift; |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 257 | }; |
| Akron | 5a5595b | 2017-09-10 13:00:57 +0200 | [diff] [blame] | 258 | return $self->{nowhere} // 0; |
| Akron | ce10cb4 | 2017-06-14 01:12:40 +0200 | [diff] [blame] | 259 | }; |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 260 | |
| Akron | 24ab289 | 2017-07-18 14:05:33 +0200 | [diff] [blame] | 261 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 262 | # Check if the query is a leaf node in the tree |
| 263 | sub is_leaf { |
| 264 | 0; |
| 265 | }; |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 266 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 267 | |
| 268 | # Check if the result of the query is extended to the right |
| 269 | sub is_extended_right { |
| 270 | $_[0]->{extended_right} // 0 |
| 271 | }; |
| 272 | |
| 273 | |
| 274 | # Check if the result of the query is extended to the left |
| 275 | sub is_extended_left { |
| 276 | $_[0]->{extended_left} // 0 |
| 277 | }; |
| 278 | |
| 279 | |
| 280 | # Check if the result of the query is extended |
| 281 | sub is_extended { |
| 282 | $_[0]->is_extended_right || $_[0]->is_extended_left // 0 |
| 283 | }; |
| 284 | |
| 285 | |
| 286 | # Is negative |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 287 | sub is_negative { |
| 288 | my $self = shift; |
| 289 | if (scalar @_ == 1) { |
| 290 | $self->{negative} = shift; |
| Akron | 5ddc38f | 2017-07-18 00:16:22 +0200 | [diff] [blame] | 291 | return $self; |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 292 | }; |
| 293 | return $self->{negative} // 0; |
| 294 | }; |
| 295 | |
| 296 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 297 | # Toggle negativity |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 298 | sub toggle_negative { |
| 299 | my $self = shift; |
| 300 | $self->is_negative($self->is_negative ? 0 : 1); |
| 301 | return $self; |
| 302 | }; |
| 303 | |
| 304 | |
| Akron | 774c5db | 2016-11-09 16:11:38 +0100 | [diff] [blame] | 305 | # TODO: Probably better to be renamed "potential_anchor" |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 306 | sub maybe_anchor { |
| 307 | my $self = shift; |
| 308 | return if $self->is_negative; |
| 309 | return if $self->is_optional; |
| Akron | 655a10a | 2017-09-11 14:13:18 +0200 | [diff] [blame] | 310 | return if $self->is_anywhere; |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 311 | return 1; |
| 312 | }; |
| 313 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 314 | |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 315 | # Check if the wrapped query may need to be sorted |
| 316 | # on focussing on a specific class. |
| 317 | # Normally spans are always sorted, but in case of |
| 318 | # a wrapped relation query, classed operands may |
| 319 | # be in arbitrary order. When focussing on these |
| 320 | # classes, the span has to me reordered. |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 321 | # TODO: |
| 322 | # Rename to classes_maybe_unsorted |
| 323 | sub maybe_unsorted { |
| 324 | $_[0]->{maybe_unsorted} // 0 |
| 325 | }; |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 326 | |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 327 | |
| Akron | 704ec06 | 2017-07-24 15:46:21 +0200 | [diff] [blame] | 328 | # Get the minimum tokens the query spans |
| 329 | sub min_span { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 330 | warn 'override'; |
| Akron | 704ec06 | 2017-07-24 15:46:21 +0200 | [diff] [blame] | 331 | }; |
| 332 | |
| 333 | |
| 334 | # Get the maximum tokens the query spans |
| 335 | # -1 means arbitrary |
| 336 | sub max_span { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 337 | warn 'override'; |
| Akron | 704ec06 | 2017-07-24 15:46:21 +0200 | [diff] [blame] | 338 | }; |
| 339 | |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 340 | |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 341 | ############################# |
| 342 | # Query Application methods # |
| 343 | ############################# |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 344 | |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 345 | # Deserialization of KoralQuery |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 346 | # TODO: export this method from Importer |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 347 | sub from_koral { |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 348 | my ($class, $kq) = @_; |
| 349 | my $importer = Krawfish::Koral::Query::Importer->new; |
| 350 | |
| 351 | my $type = $kq->{'@type'}; |
| 352 | if ($type eq 'koral:group') { |
| 353 | my $op = $kq->{operation}; |
| 354 | if ($op eq 'operation:sequence') { |
| 355 | return $importer->seq($kq); |
| 356 | } |
| 357 | |
| 358 | elsif ($op eq 'operation:class') { |
| 359 | return $importer->class($kq); |
| 360 | } |
| 361 | else { |
| Akron | 2c6c716 | 2017-05-15 18:15:33 +0200 | [diff] [blame] | 362 | warn 'Operation ' . $op . ' no supported'; |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 363 | }; |
| 364 | } |
| 365 | |
| 366 | elsif ($type eq 'koral:token') { |
| 367 | return $importer->token($kq); |
| 368 | } |
| 369 | else { |
| 370 | warn $type . ' unknown'; |
| 371 | }; |
| 372 | |
| 373 | return; |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 374 | }; |
| 375 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 376 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 377 | # Serialize |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 378 | sub to_koral_fragment { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 379 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 380 | }; |
| 381 | |
| Akron | a211bf5 | 2016-10-29 18:03:29 +0200 | [diff] [blame] | 382 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 383 | # Serialize |
| Akron | 818e852 | 2017-07-22 12:34:01 +0200 | [diff] [blame] | 384 | sub to_koral_query { |
| 385 | my $self = shift; |
| 386 | my $koral = $self->to_koral_fragment; |
| 387 | $koral->{'@context'} = CONTEXT; |
| 388 | $koral; |
| 389 | }; |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 390 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 391 | |
| 392 | # Stringification |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 393 | sub to_string { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 394 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 395 | }; |
| Akron | 33f1dcb | 2016-10-29 17:27:23 +0200 | [diff] [blame] | 396 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 397 | |
| Akron | 8231ca7 | 2017-06-16 16:08:32 +0200 | [diff] [blame] | 398 | sub to_neutral { |
| 399 | $_[0]->to_string; |
| 400 | }; |
| 401 | |
| 402 | |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 403 | # TODO: This may be optimizable and |
| 404 | # implemented in all query and corpus wrappers |
| 405 | sub to_signature { |
| 406 | md5_sum $_[0]->to_string; |
| 407 | }; |
| 408 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 409 | |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 410 | # TODO: Returns a value of complexity of the query, |
| 411 | # that can be used to decide, if a query should be cached. |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 412 | sub complexity { |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 413 | warn 'override'; |
| Akron | 290f59f | 2017-08-17 21:55:07 +0200 | [diff] [blame] | 414 | }; |
| Akron | 965f5d9 | 2017-01-20 18:38:08 +0100 | [diff] [blame] | 415 | |
| Akron | c3657bf | 2016-10-31 00:15:43 +0100 | [diff] [blame] | 416 | |
| Akron | 4763ea6 | 2016-11-02 19:36:18 +0100 | [diff] [blame] | 417 | # Create KoralQuery builder |
| 418 | sub builder { |
| 419 | return Krawfish::Koral::Query::Builder->new; |
| 420 | }; |
| 421 | |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 422 | |
| Akron | 944091b | 2016-11-24 16:40:58 +0100 | [diff] [blame] | 423 | # Create KoralQuery builder |
| 424 | sub importer { |
| 425 | return Krawfish::Koral::Query::Importer->new; |
| 426 | }; |
| 427 | |
| Akron | 169ede4 | 2017-02-05 12:52:22 +0100 | [diff] [blame] | 428 | |
| 429 | # Serialization helper |
| 430 | sub boundary { |
| 431 | my $self = shift; |
| 432 | my %hash = ( |
| 433 | '@type' => 'koral:boundary' |
| 434 | ); |
| 435 | $hash{min} = $self->{min} if defined $self->{min}; |
| 436 | $hash{max} = $self->{max} if defined $self->{max}; |
| 437 | return \%hash; |
| Akron | 5b6264f | 2017-07-19 01:14:01 +0200 | [diff] [blame] | 438 | }; |
| Akron | 169ede4 | 2017-02-05 12:52:22 +0100 | [diff] [blame] | 439 | |
| 440 | |
| Akron | a588d07 | 2017-10-13 14:45:34 +0200 | [diff] [blame] | 441 | # sub replace_references { |
| 442 | # my ($self, $refs) = @_; |
| 443 | # my $sig = $self->signature; |
| 444 | # |
| 445 | # # Subquery is identical to given query |
| 446 | # if ($refs->{$sig}) { |
| 447 | # ... |
| 448 | # } |
| 449 | # else { |
| 450 | # $refs->{$sig} = $self->operand; |
| 451 | # }; |
| 452 | # }; |
| 453 | |
| 454 | |
| Akron | 0a0e924 | 2016-10-28 14:42:29 +0200 | [diff] [blame] | 455 | 1; |