blob: 7a47d4b34bb506993ffe8747c2c13eeffadaf158 [file] [log] [blame]
/**
 * @file parser_xml.c
 * @author Radek Krejci <rkrejci@cesnet.cz>
 * @brief XML data parser for libyang
 *
 * Copyright (c) 2019 CESNET, z.s.p.o.
 *
 * This source code is licensed under BSD 3-Clause License (the "License").
 * You may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     https://opensource.org/licenses/BSD-3-Clause
 */
14
15#include "common.h"
16
17#include <stdint.h>
18#include <stdlib.h>
19#include <string.h>
20
21#include "context.h"
22#include "dict.h"
23#include "log.h"
24#include "plugins_types.h"
25#include "set.h"
26#include "tree_data.h"
27#include "tree_data_internal.h"
28#include "tree_schema.h"
29#include "xml.h"
30
31/**
32 * @brief internal context for XML YANG data parser.
33 *
34 * The leading part is compatible with the struct lyxml_context
35 */
36struct lyd_xml_ctx {
37 struct ly_ctx *ctx; /**< libyang context */
38 uint64_t line; /**< number of the line being currently processed */
39 enum LYXML_PARSER_STATUS status; /**< status providing information about the next expected object in input data */
40 struct ly_set elements; /**< list of not-yet-closed elements */
41 struct ly_set ns; /**< handled with LY_SET_OPT_USEASLIST */
42
43 uint16_t options; /**< various @ref dataparseroptions. */
44 uint16_t path_len; /**< used bytes in the path buffer */
45#define LYD_PARSER_BUFSIZE 4078
46 char path[LYD_PARSER_BUFSIZE]; /**< buffer for the generated path */
Radek Krejcie553e6d2019-06-07 15:33:18 +020047 struct ly_set incomplete_type_validation; /**< set of nodes validated with LY_EINCOMPLETE result */
Radek Krejcie7b95092019-05-15 11:03:07 +020048};
49
50/**
Radek Krejciaca74032019-06-04 08:53:06 +020051 * @brief XML-parser's implementation of ly_type_resolve_prefix() callback to provide mapping between prefixes used in the values to the schema
52 * via XML namespaces.
53 */
54static const struct lys_module *
55lydxml_resolve_prefix(struct ly_ctx *ctx, const char *prefix, size_t prefix_len, void *parser)
56{
57 const struct lyxml_ns *ns;
58 struct lyxml_context *xmlctx = (struct lyxml_context*)parser;
59
60 ns = lyxml_ns_get(xmlctx, prefix, prefix_len);
61 if (!ns) {
62 return NULL;
63 }
64
65 return ly_ctx_get_module_implemented_ns(ctx, ns->uri);
66}
67
68/**
Radek Krejcie7b95092019-05-15 11:03:07 +020069 * @brief Parse XML attributes of the XML element of YANG data.
70 *
71 * @param[in] ctx XML YANG data parser context.
Radek Krejcie7b95092019-05-15 11:03:07 +020072 * @param[in,out] data Pointer to the XML string representation of the YANG data to parse.
73 * @param[out] attributes Resulting list of the parsed attributes. XML namespace definitions are not parsed
74 * as attributes, they are stored internally in the parser context.
75 * @reutn LY_ERR value.
76 */
77static LY_ERR
Radek Krejci17a78d82019-05-15 15:49:55 +020078lydxml_attributes(struct lyd_xml_ctx *ctx, const char **data, struct lyd_attr **attributes)
Radek Krejcie7b95092019-05-15 11:03:07 +020079{
80 LY_ERR ret = LY_SUCCESS;
81 unsigned int u;
82 const char *prefix, *name;
83 size_t prefix_len, name_len;
84 struct lyd_attr *attr = NULL, *last = NULL;
85 const struct lyxml_ns *ns;
86 struct ly_set attr_prefixes = {0};
87 struct attr_prefix_s {
88 const char *prefix;
89 size_t prefix_len;
90 } *attr_prefix;
91 struct lys_module *mod;
92
93 while(ctx->status == LYXML_ATTRIBUTE &&
94 lyxml_get_attribute((struct lyxml_context*)ctx, data, &prefix, &prefix_len, &name, &name_len) == LY_SUCCESS) {
95 int dynamic = 0;
96 char *buffer = NULL, *value;
97 size_t buffer_size = 0, value_len;
98
Radek Krejci17a78d82019-05-15 15:49:55 +020099 if (!name) {
100 /* seems like all the attrributes were internally processed as namespace definitions */
101 continue;
Radek Krejcie7b95092019-05-15 11:03:07 +0200102 }
Radek Krejci17a78d82019-05-15 15:49:55 +0200103
104 /* get attribute value */
105 ret = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
106 LY_CHECK_GOTO(ret, cleanup);
107
108 attr = calloc(1, sizeof *attr);
109 LY_CHECK_ERR_GOTO(!attr, LOGMEM(ctx->ctx); ret = LY_EMEM, cleanup);
110
111 attr->name = lydict_insert(ctx->ctx, name, name_len);
112 /* auxiliary store the prefix information and wait with resolving prefix to the time when all the namespaces,
113 * defined in this element, are parsed, so we will get the correct namespace for this prefix */
114 attr_prefix = malloc(sizeof *attr_prefix);
115 attr_prefix->prefix = prefix;
116 attr_prefix->prefix_len = prefix_len;
117 ly_set_add(&attr_prefixes, attr_prefix, LY_SET_OPT_USEASLIST);
118
119 /* TODO process value */
120
121 if (last) {
122 last->next = attr;
123 } else {
124 (*attributes) = attr;
125 }
126 last = attr;
Radek Krejcie7b95092019-05-15 11:03:07 +0200127 }
128
129 /* resolve annotation pointers in all the attributes */
130 for (last = *attributes, u = 0; u < attr_prefixes.count && last; u++, last = last->next) {
131 attr_prefix = (struct attr_prefix_s*)attr_prefixes.objs[u];
132 ns = lyxml_ns_get((struct lyxml_context *)ctx, attr_prefix->prefix, attr_prefix->prefix_len);
133 mod = ly_ctx_get_module_implemented_ns(ctx->ctx, ns->uri);
134
135 /* TODO get annotation */
136 }
137
138cleanup:
139
140 ly_set_erase(&attr_prefixes, free);
141 return ret;
142}
143
144/**
145 * @brief Parse XML elements as children YANG data node of the specified parent node.
146 *
147 * @param[in] ctx XML YANG data parser context.
148 * @param[in] parent Parent node where the children are inserted. NULL in case of parsing top-level elements.
149 * @param[in,out] data Pointer to the XML string representation of the YANG data to parse.
150 * @param[out] node Resulting list of the parsed nodes.
151 * @reutn LY_ERR value.
152 */
153static LY_ERR
154lydxml_nodes(struct lyd_xml_ctx *ctx, struct lyd_node_inner *parent, const char **data, struct lyd_node **node)
155{
156 LY_ERR ret = LY_SUCCESS;
157 const char *prefix, *name;
Radek Krejcie7b95092019-05-15 11:03:07 +0200158 size_t prefix_len, name_len;
159 struct lyd_attr *attributes = NULL;
160 const struct lyxml_ns *ns;
161 const struct lysc_node *snode;
162 struct lys_module *mod;
163 unsigned int parents_count = ctx->elements.count;
Radek Krejci710226d2019-07-24 17:24:59 +0200164 struct lyd_node *cur = NULL, *prev = NULL, *last = NULL;
Radek Krejcie7b95092019-05-15 11:03:07 +0200165
166 (*node) = NULL;
167
168 while(ctx->status == LYXML_ELEMENT) {
169 ret = lyxml_get_element((struct lyxml_context *)ctx, data, &prefix, &prefix_len, &name, &name_len);
170 LY_CHECK_GOTO(ret, cleanup);
171 if (!name) {
172 /* closing previous element */
Radek Krejcie7b95092019-05-15 11:03:07 +0200173 if (ctx->elements.count < parents_count) {
174 /* all siblings parsed */
175 break;
176 } else {
177 continue;
178 }
179 }
180 attributes = NULL;
Radek Krejci1f05b6a2019-07-18 16:15:06 +0200181 if (ctx->status == LYXML_ATTRIBUTE) {
182 LY_CHECK_GOTO(lydxml_attributes(ctx, data, &attributes), cleanup);
183 }
184
Radek Krejcie7b95092019-05-15 11:03:07 +0200185 ns = lyxml_ns_get((struct lyxml_context *)ctx, prefix, prefix_len);
186 if (!ns) {
187 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "Unknown XML prefix \"%*.s\".", prefix_len, prefix);
188 goto cleanup;
189 }
190 mod = ly_ctx_get_module_implemented_ns(ctx->ctx, ns->uri);
191 if (!mod) {
192 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "No module with namespace \"%s\" in the context.", ns->uri);
193 goto cleanup;
194 }
195 snode = lys_child(parent ? parent->schema : NULL, mod, name, name_len, 0, (ctx->options & LYD_OPT_RPCREPLY) ? LYS_GETNEXT_OUTPUT : 0);
196 if (!snode) {
197 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "Element \"%.*s\" not found in the \"%s\" module.", name_len, name, mod->name);
198 goto cleanup;
199 }
200
201 /* allocate new node */
202 switch (snode->nodetype) {
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200203 case LYS_ACTION:
204 if ((ctx->options & LYD_OPT_TYPEMASK) != LYD_OPT_RPC) {
205 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_RESTRICTION, "Unexpected RPC/action element \"%.*s\" in %s data set.",
206 name_len, name, lyd_parse_options_type2str(ctx->options & LYD_OPT_TYPEMASK));
207 goto cleanup;
208 }
209 cur = calloc(1, sizeof(struct lyd_node_inner));
210 break;
211 case LYS_NOTIF:
212 if ((ctx->options & LYD_OPT_TYPEMASK) != LYD_OPT_RPC) {
213 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_RESTRICTION, "Unexpected Notification element \"%.*s\" in %s data set.",
214 name_len, name, lyd_parse_options_type2str(ctx->options));
215 goto cleanup;
216 }
217 cur = calloc(1, sizeof(struct lyd_node_inner));
218 break;
Radek Krejcie7b95092019-05-15 11:03:07 +0200219 case LYS_CONTAINER:
220 case LYS_LIST:
221 cur = calloc(1, sizeof(struct lyd_node_inner));
222 break;
223 case LYS_LEAF:
224 case LYS_LEAFLIST:
225 cur = calloc(1, sizeof(struct lyd_node_term));
226 break;
227 case LYS_ANYDATA:
228 case LYS_ANYXML:
229 cur = calloc(1, sizeof(struct lyd_node_any));
230 break;
Radek Krejcie7b95092019-05-15 11:03:07 +0200231 default:
232 LOGINT(ctx->ctx);
233 goto cleanup;
234 }
235 if (!(*node)) {
236 (*node) = cur;
237 }
Radek Krejci710226d2019-07-24 17:24:59 +0200238 last = cur;
Radek Krejcie7b95092019-05-15 11:03:07 +0200239 cur->schema = snode;
Radek Krejci710226d2019-07-24 17:24:59 +0200240 cur->prev = cur;
Radek Krejcie7b95092019-05-15 11:03:07 +0200241 cur->parent = parent;
Radek Krejcie92210c2019-05-17 15:53:35 +0200242 if (parent) {
Radek Krejci710226d2019-07-24 17:24:59 +0200243 if (prev && cur->schema->nodetype == LYS_LEAF && (cur->schema->flags & LYS_KEY)) {
244 /* it is key and we need to insert it into a correct place */
245 struct lysc_node_leaf **keys = ((struct lysc_node_list*)parent->schema)->keys;
246 unsigned int cur_index, key_index;
247 struct lyd_node *key;
248
249 for (cur_index = 0; keys[cur_index] != (struct lysc_node_leaf*)cur->schema; ++cur_index);
250 for (key = prev; !(key->schema->flags & LYS_KEY) && key->prev != prev; key = key->prev);
251 for (; key->schema->flags & LYS_KEY; key = key->prev) {
252 for (key_index = 0; keys[key_index] != (struct lysc_node_leaf*)key->schema; ++key_index);
253 if (key_index < cur_index) {
254 /* cur key is supposed to be placed after the key */
255 cur->next = key->next;
256 cur->prev = key;
257 key->next = cur;
258 if (cur->next) {
259 cur->next->prev = cur;
260 } else {
261 parent->child->prev = cur;
262 }
263 break;
264 }
265 if (key->prev == prev) {
266 /* current key is supposed to be the first child from the current children */
267 key = NULL;
268 break;
269 }
270 }
271 if (!key || !(key->schema->flags & LYS_KEY)) {
272 /* current key is supposed to be the first child from the current children */
273 cur->next = parent->child;
274 cur->prev = parent->child->prev;
275 parent->child->prev = cur;
276 parent->child = cur;
277 }
278 if (cur->next) {
279 last = prev;
280 if (ctx->options & LYD_OPT_STRICT) {
281 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_RESTRICTION, "Invalid position of the key \"%.*s\" in a list.",
282 name_len, name);
283 goto cleanup;
284 } else {
285 LOGWRN(ctx->ctx, "Invalid position of the key \"%.*s\" in a list.", name_len, name);
286 }
287 }
288 } else {
289 /* last child of the parent */
290 if (prev) {
291 parent->child->prev = cur;
292 prev->next = cur;
293 cur->prev = prev;
294 }
295 }
Radek Krejcie7b95092019-05-15 11:03:07 +0200296 } else {
Radek Krejci710226d2019-07-24 17:24:59 +0200297 /* top level */
298 if (prev) {
299 /* last top level node */
300 struct lyd_node *iter;
301 for (iter = prev; iter->prev->next; iter = iter->prev);
302 iter->prev = cur;
303 prev->next = cur;
304 cur->prev = prev;
305 } /* first top level node - nothing more to do */
Radek Krejcie7b95092019-05-15 11:03:07 +0200306 }
Radek Krejci710226d2019-07-24 17:24:59 +0200307 prev = last;
Radek Krejcie7b95092019-05-15 11:03:07 +0200308 cur->attr = attributes;
309 attributes = NULL;
310
311 if (snode->nodetype & LYD_NODE_TERM) {
312 int dynamic = 0;
313 char *buffer = NULL, *value;
314 size_t buffer_size = 0, value_len;
315
316 if (ctx->status == LYXML_ELEM_CONTENT) {
317 /* get the value */
Radek Krejci339e2de2019-05-17 14:28:24 +0200318 LY_ERR r = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
319 if (r == LY_EINVAL) {
320 /* just indentation of a child element found */
321 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_SYNTAX, "Child element inside terminal node \"%s\" found.", cur->schema->name);
322 goto cleanup;
323 }
Radek Krejcie92210c2019-05-17 15:53:35 +0200324 } else {
325 /* no content - validate empty value */
326 value = "";
327 value_len = 0;
Radek Krejcie7b95092019-05-15 11:03:07 +0200328 }
Radek Krejci3c9758d2019-07-11 16:49:10 +0200329 ret = lyd_value_parse((struct lyd_node_term*)cur, value, value_len, dynamic, 0, lydxml_resolve_prefix, ctx, LYD_XML, NULL);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200330 if (ret == LY_EINCOMPLETE) {
331 ly_set_add(&ctx->incomplete_type_validation, cur, LY_SET_OPT_USEASLIST);
332 } else if (ret) {
333 if (dynamic){
334 free(value);
335 }
336 goto cleanup;
337 }
Radek Krejcie7b95092019-05-15 11:03:07 +0200338 } else if (snode->nodetype & LYD_NODE_INNER) {
339 int dynamic = 0;
340 char *buffer = NULL, *value;
341 size_t buffer_size = 0, value_len;
342
343 if (ctx->status == LYXML_ELEM_CONTENT) {
344 LY_ERR r = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200345 if (r != LY_EINVAL && (r != LY_SUCCESS || value_len != 0)) {
Radek Krejcie7b95092019-05-15 11:03:07 +0200346 LOGINT(ctx->ctx);
347 goto cleanup;
348 }
349 }
Radek Krejciee4cab22019-07-17 17:07:47 +0200350 /* process children */
Radek Krejcie553e6d2019-06-07 15:33:18 +0200351 if (ctx->status == LYXML_ELEMENT && parents_count != ctx->elements.count) {
Radek Krejcie7b95092019-05-15 11:03:07 +0200352 ret = lydxml_nodes(ctx, (struct lyd_node_inner*)cur, data, lyd_node_children_p(cur));
Radek Krejcie92210c2019-05-17 15:53:35 +0200353 LY_CHECK_GOTO(ret, cleanup);
Radek Krejcie7b95092019-05-15 11:03:07 +0200354 }
Radek Krejciee4cab22019-07-17 17:07:47 +0200355 } else if (snode->nodetype & LYD_NODE_ANY) {
356 unsigned int cur_element_index = ctx->elements.count;
357 const char *start = *data, *stop;
358 const char *p, *n;
359 size_t p_len, n_len;
360
361 /* skip children data and store them as a string */
362 while (cur_element_index <= ctx->elements.count) {
363 switch (ctx->status) {
364 case LYXML_ELEMENT:
365 ret = lyxml_get_element((struct lyxml_context *)ctx, data, &p, &p_len, &n, &n_len);
366 break;
367 case LYXML_ATTRIBUTE:
368 lyxml_get_attribute((struct lyxml_context*)ctx, data, &p, &p_len, &n, &n_len);
369 break;
370 case LYXML_ELEM_CONTENT:
371 case LYXML_ATTR_CONTENT:
372 ret = lyxml_get_string((struct lyxml_context *)ctx, data, NULL, NULL, NULL, NULL, NULL);
373 if (ret == LY_EINVAL) {
374 /* not an error, just incorrect XML parser status */
375 ret = LY_SUCCESS;
376 }
377 break;
378 case LYXML_END:
379 /* unexpected end of data */
380 LOGINT(ctx->ctx);
381 goto cleanup;
382 }
383 LY_CHECK_GOTO(ret, cleanup);
384 }
385 /* data now points after the anydata's closing element tag, we need just end of its content */
386 for (stop = *data - 1; *stop != '<'; --stop);
387
388 ((struct lyd_node_any*)cur)->value_type = LYD_ANYDATA_XML;
389 ((struct lyd_node_any*)cur)->value.xml = lydict_insert(ctx->ctx, start, stop - start);
Radek Krejcie7b95092019-05-15 11:03:07 +0200390 }
Radek Krejci1f05b6a2019-07-18 16:15:06 +0200391
392 /* calculate the hash and insert it into parent (list with keys is handled when its keys are inserted) */
393 lyd_hash(cur);
394 lyd_insert_hash(cur);
Radek Krejcib6f7ae52019-07-19 10:31:42 +0200395
396 /* if we have empty non-presence container, we keep it, but mark it as default */
397 if (cur->schema->nodetype == LYS_CONTAINER && !((struct lyd_node_inner*)cur)->child &&
398 !cur->attr && !(((struct lysc_node_container*)cur->schema)->flags & LYS_PRESENCE)) {
399 cur->flags |= LYD_DEFAULT;
400 }
401
402 /* TODO context validation */
Radek Krejcie7b95092019-05-15 11:03:07 +0200403 }
404
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200405 /* TODO add missing siblings default elements */
406
Radek Krejcie7b95092019-05-15 11:03:07 +0200407cleanup:
Radek Krejcie7b95092019-05-15 11:03:07 +0200408 lyd_free_attr(ctx->ctx, attributes, 1);
Radek Krejcie7b95092019-05-15 11:03:07 +0200409 return ret;
410}
411
412LY_ERR
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200413lyd_parse_xml(struct ly_ctx *ctx, const char *data, int options, const struct lyd_node **trees, struct lyd_node **result)
Radek Krejcie7b95092019-05-15 11:03:07 +0200414{
415 LY_ERR ret;
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200416 struct lyd_node_inner *parent = NULL;
Radek Krejcie7b95092019-05-15 11:03:07 +0200417 struct lyd_xml_ctx xmlctx = {0};
418
419 xmlctx.options = options;
420 xmlctx.ctx = ctx;
421 xmlctx.line = 1;
422
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200423 /* init */
424 *result = NULL;
425
426 if (!data || !data[0]) {
427 goto no_data;
428 }
429
430 if (options & LYD_OPT_RPCREPLY) {
431 /* TODO prepare container for RPC reply, for which we need RPC
432 * - prepare *result as top-level node
433 * - prepare parent as the RPC/action node */
434 (void)trees;
435 }
436
437 ret = lydxml_nodes(&xmlctx, parent, &data, *result ? &parent->child : result);
Radek Krejcie92210c2019-05-17 15:53:35 +0200438 if (ret) {
439 lyd_free_all(*result);
440 *result = NULL;
Radek Krejcie553e6d2019-06-07 15:33:18 +0200441 } else {
442 /* finish incompletely validated terminal values */
443 for (unsigned int u = 0; u < xmlctx.incomplete_type_validation.count; u++) {
444 struct lyd_node_term *node = (struct lyd_node_term*)xmlctx.incomplete_type_validation.objs[u];
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200445 const struct lyd_node **result_trees = NULL;
Radek Krejcie72c0432019-06-10 10:17:03 +0200446
447 /* prepare sized array for validator */
448 if (*result) {
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200449 result_trees = lyd_trees_new(1, *result);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200450 }
Radek Krejcie72c0432019-06-10 10:17:03 +0200451 /* validate and store the value of the node */
Radek Krejci3c9758d2019-07-11 16:49:10 +0200452 ret = lyd_value_parse(node, node->value.canonized, node->value.canonized ? strlen(node->value.canonized) : 0, 0, 1,
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200453 lydxml_resolve_prefix, ctx, LYD_XML, result_trees);
454 lyd_trees_free(result_trees, 0);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200455 if (ret) {
456 lyd_free_all(*result);
457 *result = NULL;
458 break;
459 }
460 }
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200461
462 if (!(*result)) {
463no_data:
464 /* no data */
465 if (options & (LYD_OPT_RPC | LYD_OPT_NOTIF)) {
466 /* error, top level node identify RPC and Notification */
467 LOGERR(ctx, LY_EINVAL, "Invalid input data of data parser - expected %s which cannot be empty.",
468 lyd_parse_options_type2str(options));
469 } else {
470 /* others - no work is needed, just check for missing mandatory nodes */
471 /* TODO lyd_validate(&result, options, ctx); */
472 }
473 }
Radek Krejcie92210c2019-05-17 15:53:35 +0200474 }
Radek Krejcie553e6d2019-06-07 15:33:18 +0200475
476 ly_set_erase(&xmlctx.incomplete_type_validation, NULL);
Radek Krejcie7b95092019-05-15 11:03:07 +0200477 lyxml_context_clear((struct lyxml_context*)&xmlctx);
478 return ret;
479}