blob: 9d32042ed4e8916a39e05bd8df725353dea9648c [file] [log] [blame]
Akron32d53de2025-05-22 13:45:32 +02001package mapper
2
3import (
4 "encoding/json"
5 "fmt"
6
Akronfa55bb22025-05-26 15:10:42 +02007 "github.com/KorAP/KoralPipe-TermMapper/ast"
8 "github.com/KorAP/KoralPipe-TermMapper/config"
9 "github.com/KorAP/KoralPipe-TermMapper/matcher"
10 "github.com/KorAP/KoralPipe-TermMapper/parser"
Akron32d53de2025-05-22 13:45:32 +020011)
12
// Direction selects which way a mapping is applied: from side A to side B,
// or from side B to side A. It is a bool underneath, so the zero value is BtoA.
type Direction bool

// The two supported mapping directions.
const (
	// AtoB maps from side A to side B.
	AtoB Direction = true
	// BtoA maps from side B to side A.
	BtoA Direction = false
)

// String returns the textual form of the direction: "atob" for AtoB and
// "btoa" for BtoA.
func (d Direction) String() string {
	switch d {
	case AtoB:
		return "atob"
	default:
		return "btoa"
	}
}

// ParseDirection is the inverse of Direction.String. It accepts exactly
// "atob" and "btoa" (case-sensitive); any other input yields an error and
// the zero Direction (BtoA).
func ParseDirection(dir string) (Direction, error) {
	if dir == "atob" {
		return AtoB, nil
	}
	if dir == "btoa" {
		return BtoA, nil
	}
	return BtoA, fmt.Errorf("invalid direction: %s", dir)
}
40
Akron32d53de2025-05-22 13:45:32 +020041// Mapper handles the application of mapping rules to JSON objects
42type Mapper struct {
43 mappingLists map[string]*config.MappingList
44 parsedRules map[string][]*parser.MappingResult
45}
46
Akrona00d4752025-05-26 17:34:36 +020047// NewMapper creates a new Mapper instance from a list of MappingLists
48func NewMapper(lists []config.MappingList) (*Mapper, error) {
Akron32d53de2025-05-22 13:45:32 +020049 m := &Mapper{
50 mappingLists: make(map[string]*config.MappingList),
51 parsedRules: make(map[string][]*parser.MappingResult),
52 }
53
Akrona00d4752025-05-26 17:34:36 +020054 // Store mapping lists by ID
55 for _, list := range lists {
56 if _, exists := m.mappingLists[list.ID]; exists {
57 return nil, fmt.Errorf("duplicate mapping list ID found: %s", list.ID)
58 }
59
60 // Create a copy of the list to store
61 listCopy := list
62 m.mappingLists[list.ID] = &listCopy
63
64 // Parse the rules immediately
65 parsedRules, err := list.ParseMappings()
Akron32d53de2025-05-22 13:45:32 +020066 if err != nil {
Akrona00d4752025-05-26 17:34:36 +020067 return nil, fmt.Errorf("failed to parse mappings for list %s: %w", list.ID, err)
Akron32d53de2025-05-22 13:45:32 +020068 }
Akrona00d4752025-05-26 17:34:36 +020069 m.parsedRules[list.ID] = parsedRules
Akron32d53de2025-05-22 13:45:32 +020070 }
71
72 return m, nil
73}
74
75// MappingOptions contains the options for applying mappings
76type MappingOptions struct {
77 FoundryA string
78 LayerA string
79 FoundryB string
80 LayerB string
81 Direction Direction
82}
83
Akron7b4984e2025-05-26 19:12:20 +020084// ApplyQueryMappings applies the specified mapping rules to a JSON object
85func (m *Mapper) ApplyQueryMappings(mappingID string, opts MappingOptions, jsonData any) (any, error) {
Akron32d53de2025-05-22 13:45:32 +020086 // Validate mapping ID
87 if _, exists := m.mappingLists[mappingID]; !exists {
88 return nil, fmt.Errorf("mapping list with ID %s not found", mappingID)
89 }
90
Akron32d53de2025-05-22 13:45:32 +020091 // Get the parsed rules
92 rules := m.parsedRules[mappingID]
93
Akron7b4984e2025-05-26 19:12:20 +020094 // Check if we have a wrapper object with a "query" field
95 var queryData any
96 var hasQueryWrapper bool
97
98 if jsonMap, ok := jsonData.(map[string]any); ok {
99 if query, exists := jsonMap["query"]; exists {
100 queryData = query
101 hasQueryWrapper = true
102 }
103 }
104
105 // If no query wrapper was found, use the entire input
106 if !hasQueryWrapper {
107 // If the input itself is not a valid query object, return it as is
108 if !isValidQueryObject(jsonData) {
109 return jsonData, nil
110 }
111 queryData = jsonData
112 } else if queryData == nil || !isValidQueryObject(queryData) {
113 // If we have a query wrapper but the query is nil or not a valid object,
114 // return the original data
115 return jsonData, nil
116 }
117
Akron32d53de2025-05-22 13:45:32 +0200118 // Convert input JSON to AST
Akron7b4984e2025-05-26 19:12:20 +0200119 jsonBytes, err := json.Marshal(queryData)
Akron32d53de2025-05-22 13:45:32 +0200120 if err != nil {
121 return nil, fmt.Errorf("failed to marshal input JSON: %w", err)
122 }
123
124 node, err := parser.ParseJSON(jsonBytes)
125 if err != nil {
126 return nil, fmt.Errorf("failed to parse JSON into AST: %w", err)
127 }
128
Akrond5850f82025-05-23 16:44:44 +0200129 // Store whether the input was a Token
130 isToken := false
131 var tokenWrap ast.Node
Akron32d53de2025-05-22 13:45:32 +0200132 if token, ok := node.(*ast.Token); ok {
Akrond5850f82025-05-23 16:44:44 +0200133 isToken = true
134 tokenWrap = token.Wrap
135 node = tokenWrap
Akron32d53de2025-05-22 13:45:32 +0200136 }
137
138 // Apply each rule to the AST
139 for _, rule := range rules {
140 // Create pattern and replacement based on direction
141 var pattern, replacement ast.Node
Akrona1a183f2025-05-26 17:47:33 +0200142 if opts.Direction { // true means AtoB
Akron32d53de2025-05-22 13:45:32 +0200143 pattern = rule.Upper
144 replacement = rule.Lower
145 } else {
146 pattern = rule.Lower
147 replacement = rule.Upper
148 }
149
150 // Extract the inner nodes from the pattern and replacement tokens
151 if token, ok := pattern.(*ast.Token); ok {
152 pattern = token.Wrap
153 }
154 if token, ok := replacement.(*ast.Token); ok {
155 replacement = token.Wrap
156 }
157
158 // Apply foundry and layer overrides
Akrona1a183f2025-05-26 17:47:33 +0200159 if opts.Direction { // true means AtoB
Akron32d53de2025-05-22 13:45:32 +0200160 applyFoundryAndLayerOverrides(pattern, opts.FoundryA, opts.LayerA)
161 applyFoundryAndLayerOverrides(replacement, opts.FoundryB, opts.LayerB)
162 } else {
163 applyFoundryAndLayerOverrides(pattern, opts.FoundryB, opts.LayerB)
164 applyFoundryAndLayerOverrides(replacement, opts.FoundryA, opts.LayerA)
165 }
166
167 // Create matcher and apply replacement
Akrond5850f82025-05-23 16:44:44 +0200168 m, err := matcher.NewMatcher(ast.Pattern{Root: pattern}, ast.Replacement{Root: replacement})
169 if err != nil {
170 return nil, fmt.Errorf("failed to create matcher: %w", err)
171 }
Akron32d53de2025-05-22 13:45:32 +0200172 node = m.Replace(node)
173 }
174
Akrond5850f82025-05-23 16:44:44 +0200175 // Wrap the result in a token if the input was a token
176 var result ast.Node
177 if isToken {
178 result = &ast.Token{Wrap: node}
179 } else {
180 result = node
181 }
Akron32d53de2025-05-22 13:45:32 +0200182
183 // Convert AST back to JSON
184 resultBytes, err := parser.SerializeToJSON(result)
185 if err != nil {
186 return nil, fmt.Errorf("failed to serialize AST to JSON: %w", err)
187 }
188
Akron6f455152025-05-27 09:03:00 +0200189 // Parse the JSON string back into
190 var resultData any
Akron32d53de2025-05-22 13:45:32 +0200191 if err := json.Unmarshal(resultBytes, &resultData); err != nil {
192 return nil, fmt.Errorf("failed to parse result JSON: %w", err)
193 }
194
Akron7b4984e2025-05-26 19:12:20 +0200195 // If we had a query wrapper, put the transformed data back in it
196 if hasQueryWrapper {
197 if wrapper, ok := jsonData.(map[string]any); ok {
198 wrapper["query"] = resultData
199 return wrapper, nil
200 }
201 }
202
Akron32d53de2025-05-22 13:45:32 +0200203 return resultData, nil
204}
205
// isValidQueryObject reports whether data can be processed as a query: it
// must be a map[string]any that contains an "@type" key. Only the presence of
// the key is checked, not its value.
func isValidQueryObject(data any) bool {
	obj, isMap := data.(map[string]any)
	if !isMap {
		return false
	}

	_, hasType := obj["@type"]
	return hasType
}
221
Akron32d53de2025-05-22 13:45:32 +0200222// applyFoundryAndLayerOverrides recursively applies foundry and layer overrides to terms
223func applyFoundryAndLayerOverrides(node ast.Node, foundry, layer string) {
224 if node == nil {
225 return
226 }
227
228 switch n := node.(type) {
229 case *ast.Term:
230 if foundry != "" {
231 n.Foundry = foundry
232 }
233 if layer != "" {
234 n.Layer = layer
235 }
236 case *ast.TermGroup:
237 for _, op := range n.Operands {
238 applyFoundryAndLayerOverrides(op, foundry, layer)
239 }
240 case *ast.Token:
241 if n.Wrap != nil {
242 applyFoundryAndLayerOverrides(n.Wrap, foundry, layer)
243 }
244 case *ast.CatchallNode:
245 if n.Wrap != nil {
246 applyFoundryAndLayerOverrides(n.Wrap, foundry, layer)
247 }
248 for _, op := range n.Operands {
249 applyFoundryAndLayerOverrides(op, foundry, layer)
250 }
251 }
252}