/**
 * @file parser_xml.c
 * @author Radek Krejci <rkrejci@cesnet.cz>
 * @brief XML data parser for libyang
 *
 * Copyright (c) 2019 CESNET, z.s.p.o.
 *
 * This source code is licensed under BSD 3-Clause License (the "License").
 * You may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     https://opensource.org/licenses/BSD-3-Clause
 */
14
15#include "common.h"
16
17#include <stdint.h>
18#include <stdlib.h>
19#include <string.h>
20
21#include "context.h"
22#include "dict.h"
23#include "log.h"
24#include "plugins_types.h"
25#include "set.h"
26#include "tree_data.h"
27#include "tree_data_internal.h"
28#include "tree_schema.h"
29#include "xml.h"
30
31/**
32 * @brief internal context for XML YANG data parser.
33 *
34 * The leading part is compatible with the struct lyxml_context
35 */
36struct lyd_xml_ctx {
37 struct ly_ctx *ctx; /**< libyang context */
38 uint64_t line; /**< number of the line being currently processed */
39 enum LYXML_PARSER_STATUS status; /**< status providing information about the next expected object in input data */
40 struct ly_set elements; /**< list of not-yet-closed elements */
41 struct ly_set ns; /**< handled with LY_SET_OPT_USEASLIST */
42
43 uint16_t options; /**< various @ref dataparseroptions. */
44 uint16_t path_len; /**< used bytes in the path buffer */
45#define LYD_PARSER_BUFSIZE 4078
46 char path[LYD_PARSER_BUFSIZE]; /**< buffer for the generated path */
Radek Krejcie553e6d2019-06-07 15:33:18 +020047 struct ly_set incomplete_type_validation; /**< set of nodes validated with LY_EINCOMPLETE result */
Radek Krejcie7b95092019-05-15 11:03:07 +020048};
49
50/**
Radek Krejciaca74032019-06-04 08:53:06 +020051 * @brief XML-parser's implementation of ly_type_resolve_prefix() callback to provide mapping between prefixes used in the values to the schema
52 * via XML namespaces.
53 */
54static const struct lys_module *
55lydxml_resolve_prefix(struct ly_ctx *ctx, const char *prefix, size_t prefix_len, void *parser)
56{
57 const struct lyxml_ns *ns;
58 struct lyxml_context *xmlctx = (struct lyxml_context*)parser;
59
60 ns = lyxml_ns_get(xmlctx, prefix, prefix_len);
61 if (!ns) {
62 return NULL;
63 }
64
65 return ly_ctx_get_module_implemented_ns(ctx, ns->uri);
66}
67
68/**
Radek Krejcie7b95092019-05-15 11:03:07 +020069 * @brief Parse XML attributes of the XML element of YANG data.
70 *
71 * @param[in] ctx XML YANG data parser context.
Radek Krejcie7b95092019-05-15 11:03:07 +020072 * @param[in,out] data Pointer to the XML string representation of the YANG data to parse.
73 * @param[out] attributes Resulting list of the parsed attributes. XML namespace definitions are not parsed
74 * as attributes, they are stored internally in the parser context.
75 * @reutn LY_ERR value.
76 */
77static LY_ERR
Radek Krejci17a78d82019-05-15 15:49:55 +020078lydxml_attributes(struct lyd_xml_ctx *ctx, const char **data, struct lyd_attr **attributes)
Radek Krejcie7b95092019-05-15 11:03:07 +020079{
80 LY_ERR ret = LY_SUCCESS;
81 unsigned int u;
82 const char *prefix, *name;
83 size_t prefix_len, name_len;
84 struct lyd_attr *attr = NULL, *last = NULL;
85 const struct lyxml_ns *ns;
86 struct ly_set attr_prefixes = {0};
87 struct attr_prefix_s {
88 const char *prefix;
89 size_t prefix_len;
90 } *attr_prefix;
91 struct lys_module *mod;
92
93 while(ctx->status == LYXML_ATTRIBUTE &&
94 lyxml_get_attribute((struct lyxml_context*)ctx, data, &prefix, &prefix_len, &name, &name_len) == LY_SUCCESS) {
95 int dynamic = 0;
96 char *buffer = NULL, *value;
97 size_t buffer_size = 0, value_len;
98
Radek Krejci17a78d82019-05-15 15:49:55 +020099 if (!name) {
100 /* seems like all the attrributes were internally processed as namespace definitions */
101 continue;
Radek Krejcie7b95092019-05-15 11:03:07 +0200102 }
Radek Krejci17a78d82019-05-15 15:49:55 +0200103
104 /* get attribute value */
105 ret = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
106 LY_CHECK_GOTO(ret, cleanup);
107
108 attr = calloc(1, sizeof *attr);
109 LY_CHECK_ERR_GOTO(!attr, LOGMEM(ctx->ctx); ret = LY_EMEM, cleanup);
110
111 attr->name = lydict_insert(ctx->ctx, name, name_len);
112 /* auxiliary store the prefix information and wait with resolving prefix to the time when all the namespaces,
113 * defined in this element, are parsed, so we will get the correct namespace for this prefix */
114 attr_prefix = malloc(sizeof *attr_prefix);
115 attr_prefix->prefix = prefix;
116 attr_prefix->prefix_len = prefix_len;
117 ly_set_add(&attr_prefixes, attr_prefix, LY_SET_OPT_USEASLIST);
118
119 /* TODO process value */
120
121 if (last) {
122 last->next = attr;
123 } else {
124 (*attributes) = attr;
125 }
126 last = attr;
Radek Krejcie7b95092019-05-15 11:03:07 +0200127 }
128
129 /* resolve annotation pointers in all the attributes */
130 for (last = *attributes, u = 0; u < attr_prefixes.count && last; u++, last = last->next) {
131 attr_prefix = (struct attr_prefix_s*)attr_prefixes.objs[u];
132 ns = lyxml_ns_get((struct lyxml_context *)ctx, attr_prefix->prefix, attr_prefix->prefix_len);
133 mod = ly_ctx_get_module_implemented_ns(ctx->ctx, ns->uri);
134
135 /* TODO get annotation */
136 }
137
138cleanup:
139
140 ly_set_erase(&attr_prefixes, free);
141 return ret;
142}
143
144/**
145 * @brief Parse XML elements as children YANG data node of the specified parent node.
146 *
147 * @param[in] ctx XML YANG data parser context.
148 * @param[in] parent Parent node where the children are inserted. NULL in case of parsing top-level elements.
149 * @param[in,out] data Pointer to the XML string representation of the YANG data to parse.
150 * @param[out] node Resulting list of the parsed nodes.
151 * @reutn LY_ERR value.
152 */
153static LY_ERR
154lydxml_nodes(struct lyd_xml_ctx *ctx, struct lyd_node_inner *parent, const char **data, struct lyd_node **node)
155{
156 LY_ERR ret = LY_SUCCESS;
157 const char *prefix, *name;
Radek Krejcie7b95092019-05-15 11:03:07 +0200158 size_t prefix_len, name_len;
159 struct lyd_attr *attributes = NULL;
160 const struct lyxml_ns *ns;
161 const struct lysc_node *snode;
162 struct lys_module *mod;
163 unsigned int parents_count = ctx->elements.count;
164 struct lyd_node *cur = NULL, *prev = NULL;
165
166 (*node) = NULL;
167
168 while(ctx->status == LYXML_ELEMENT) {
169 ret = lyxml_get_element((struct lyxml_context *)ctx, data, &prefix, &prefix_len, &name, &name_len);
170 LY_CHECK_GOTO(ret, cleanup);
171 if (!name) {
172 /* closing previous element */
Radek Krejcie7b95092019-05-15 11:03:07 +0200173 if (ctx->elements.count < parents_count) {
174 /* all siblings parsed */
175 break;
176 } else {
177 continue;
178 }
179 }
180 attributes = NULL;
Radek Krejci1f05b6a2019-07-18 16:15:06 +0200181 if (ctx->status == LYXML_ATTRIBUTE) {
182 LY_CHECK_GOTO(lydxml_attributes(ctx, data, &attributes), cleanup);
183 }
184
Radek Krejcie7b95092019-05-15 11:03:07 +0200185 ns = lyxml_ns_get((struct lyxml_context *)ctx, prefix, prefix_len);
186 if (!ns) {
187 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "Unknown XML prefix \"%*.s\".", prefix_len, prefix);
188 goto cleanup;
189 }
190 mod = ly_ctx_get_module_implemented_ns(ctx->ctx, ns->uri);
191 if (!mod) {
192 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "No module with namespace \"%s\" in the context.", ns->uri);
193 goto cleanup;
194 }
195 snode = lys_child(parent ? parent->schema : NULL, mod, name, name_len, 0, (ctx->options & LYD_OPT_RPCREPLY) ? LYS_GETNEXT_OUTPUT : 0);
196 if (!snode) {
197 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_REFERENCE, "Element \"%.*s\" not found in the \"%s\" module.", name_len, name, mod->name);
198 goto cleanup;
199 }
200
201 /* allocate new node */
202 switch (snode->nodetype) {
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200203 case LYS_ACTION:
204 if ((ctx->options & LYD_OPT_TYPEMASK) != LYD_OPT_RPC) {
205 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_RESTRICTION, "Unexpected RPC/action element \"%.*s\" in %s data set.",
206 name_len, name, lyd_parse_options_type2str(ctx->options & LYD_OPT_TYPEMASK));
207 goto cleanup;
208 }
209 cur = calloc(1, sizeof(struct lyd_node_inner));
210 break;
211 case LYS_NOTIF:
212 if ((ctx->options & LYD_OPT_TYPEMASK) != LYD_OPT_RPC) {
213 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_RESTRICTION, "Unexpected Notification element \"%.*s\" in %s data set.",
214 name_len, name, lyd_parse_options_type2str(ctx->options));
215 goto cleanup;
216 }
217 cur = calloc(1, sizeof(struct lyd_node_inner));
218 break;
Radek Krejcie7b95092019-05-15 11:03:07 +0200219 case LYS_CONTAINER:
220 case LYS_LIST:
221 cur = calloc(1, sizeof(struct lyd_node_inner));
222 break;
223 case LYS_LEAF:
224 case LYS_LEAFLIST:
225 cur = calloc(1, sizeof(struct lyd_node_term));
226 break;
227 case LYS_ANYDATA:
228 case LYS_ANYXML:
229 cur = calloc(1, sizeof(struct lyd_node_any));
230 break;
Radek Krejcie7b95092019-05-15 11:03:07 +0200231 default:
232 LOGINT(ctx->ctx);
233 goto cleanup;
234 }
235 if (!(*node)) {
236 (*node) = cur;
237 }
238 cur->schema = snode;
239 cur->parent = parent;
Radek Krejcie92210c2019-05-17 15:53:35 +0200240 if (parent) {
241 parent->child->prev = cur;
242 } else if (prev) {
243 struct lyd_node *iter;
244 for (iter = prev; iter->prev->next; iter = iter->prev);
245 iter->prev = cur;
246 }
Radek Krejcie7b95092019-05-15 11:03:07 +0200247 if (prev) {
248 cur->prev = prev;
249 prev->next = cur;
250 } else {
251 cur->prev = cur;
252 }
253 prev = cur;
254 cur->attr = attributes;
255 attributes = NULL;
256
257 if (snode->nodetype & LYD_NODE_TERM) {
258 int dynamic = 0;
259 char *buffer = NULL, *value;
260 size_t buffer_size = 0, value_len;
261
262 if (ctx->status == LYXML_ELEM_CONTENT) {
263 /* get the value */
Radek Krejci339e2de2019-05-17 14:28:24 +0200264 LY_ERR r = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
265 if (r == LY_EINVAL) {
266 /* just indentation of a child element found */
267 LOGVAL(ctx->ctx, LY_VLOG_LINE, &ctx->line, LYVE_SYNTAX, "Child element inside terminal node \"%s\" found.", cur->schema->name);
268 goto cleanup;
269 }
Radek Krejcie92210c2019-05-17 15:53:35 +0200270 } else {
271 /* no content - validate empty value */
272 value = "";
273 value_len = 0;
Radek Krejcie7b95092019-05-15 11:03:07 +0200274 }
Radek Krejci3c9758d2019-07-11 16:49:10 +0200275 ret = lyd_value_parse((struct lyd_node_term*)cur, value, value_len, dynamic, 0, lydxml_resolve_prefix, ctx, LYD_XML, NULL);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200276 if (ret == LY_EINCOMPLETE) {
277 ly_set_add(&ctx->incomplete_type_validation, cur, LY_SET_OPT_USEASLIST);
278 } else if (ret) {
279 if (dynamic){
280 free(value);
281 }
282 goto cleanup;
283 }
Radek Krejcie7b95092019-05-15 11:03:07 +0200284 } else if (snode->nodetype & LYD_NODE_INNER) {
285 int dynamic = 0;
286 char *buffer = NULL, *value;
287 size_t buffer_size = 0, value_len;
288
289 if (ctx->status == LYXML_ELEM_CONTENT) {
290 LY_ERR r = lyxml_get_string((struct lyxml_context *)ctx, data, &buffer, &buffer_size, &value, &value_len, &dynamic);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200291 if (r != LY_EINVAL && (r != LY_SUCCESS || value_len != 0)) {
Radek Krejcie7b95092019-05-15 11:03:07 +0200292 LOGINT(ctx->ctx);
293 goto cleanup;
294 }
295 }
Radek Krejciee4cab22019-07-17 17:07:47 +0200296 /* process children */
Radek Krejcie553e6d2019-06-07 15:33:18 +0200297 if (ctx->status == LYXML_ELEMENT && parents_count != ctx->elements.count) {
Radek Krejcie7b95092019-05-15 11:03:07 +0200298 ret = lydxml_nodes(ctx, (struct lyd_node_inner*)cur, data, lyd_node_children_p(cur));
Radek Krejcie92210c2019-05-17 15:53:35 +0200299 LY_CHECK_GOTO(ret, cleanup);
Radek Krejcie7b95092019-05-15 11:03:07 +0200300 }
Radek Krejciee4cab22019-07-17 17:07:47 +0200301 } else if (snode->nodetype & LYD_NODE_ANY) {
302 unsigned int cur_element_index = ctx->elements.count;
303 const char *start = *data, *stop;
304 const char *p, *n;
305 size_t p_len, n_len;
306
307 /* skip children data and store them as a string */
308 while (cur_element_index <= ctx->elements.count) {
309 switch (ctx->status) {
310 case LYXML_ELEMENT:
311 ret = lyxml_get_element((struct lyxml_context *)ctx, data, &p, &p_len, &n, &n_len);
312 break;
313 case LYXML_ATTRIBUTE:
314 lyxml_get_attribute((struct lyxml_context*)ctx, data, &p, &p_len, &n, &n_len);
315 break;
316 case LYXML_ELEM_CONTENT:
317 case LYXML_ATTR_CONTENT:
318 ret = lyxml_get_string((struct lyxml_context *)ctx, data, NULL, NULL, NULL, NULL, NULL);
319 if (ret == LY_EINVAL) {
320 /* not an error, just incorrect XML parser status */
321 ret = LY_SUCCESS;
322 }
323 break;
324 case LYXML_END:
325 /* unexpected end of data */
326 LOGINT(ctx->ctx);
327 goto cleanup;
328 }
329 LY_CHECK_GOTO(ret, cleanup);
330 }
331 /* data now points after the anydata's closing element tag, we need just end of its content */
332 for (stop = *data - 1; *stop != '<'; --stop);
333
334 ((struct lyd_node_any*)cur)->value_type = LYD_ANYDATA_XML;
335 ((struct lyd_node_any*)cur)->value.xml = lydict_insert(ctx->ctx, start, stop - start);
Radek Krejcie7b95092019-05-15 11:03:07 +0200336 }
Radek Krejci1f05b6a2019-07-18 16:15:06 +0200337
338 /* calculate the hash and insert it into parent (list with keys is handled when its keys are inserted) */
339 lyd_hash(cur);
340 lyd_insert_hash(cur);
Radek Krejcib6f7ae52019-07-19 10:31:42 +0200341
342 /* if we have empty non-presence container, we keep it, but mark it as default */
343 if (cur->schema->nodetype == LYS_CONTAINER && !((struct lyd_node_inner*)cur)->child &&
344 !cur->attr && !(((struct lysc_node_container*)cur->schema)->flags & LYS_PRESENCE)) {
345 cur->flags |= LYD_DEFAULT;
346 }
347
348 /* TODO context validation */
Radek Krejcie7b95092019-05-15 11:03:07 +0200349 }
350
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200351 /* TODO add missing siblings default elements */
352
Radek Krejcie7b95092019-05-15 11:03:07 +0200353cleanup:
Radek Krejcie7b95092019-05-15 11:03:07 +0200354 lyd_free_attr(ctx->ctx, attributes, 1);
Radek Krejcie7b95092019-05-15 11:03:07 +0200355 return ret;
356}
357
358LY_ERR
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200359lyd_parse_xml(struct ly_ctx *ctx, const char *data, int options, const struct lyd_node **trees, struct lyd_node **result)
Radek Krejcie7b95092019-05-15 11:03:07 +0200360{
361 LY_ERR ret;
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200362 struct lyd_node_inner *parent = NULL;
Radek Krejcie7b95092019-05-15 11:03:07 +0200363 struct lyd_xml_ctx xmlctx = {0};
364
365 xmlctx.options = options;
366 xmlctx.ctx = ctx;
367 xmlctx.line = 1;
368
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200369 /* init */
370 *result = NULL;
371
372 if (!data || !data[0]) {
373 goto no_data;
374 }
375
376 if (options & LYD_OPT_RPCREPLY) {
377 /* TODO prepare container for RPC reply, for which we need RPC
378 * - prepare *result as top-level node
379 * - prepare parent as the RPC/action node */
380 (void)trees;
381 }
382
383 ret = lydxml_nodes(&xmlctx, parent, &data, *result ? &parent->child : result);
Radek Krejcie92210c2019-05-17 15:53:35 +0200384 if (ret) {
385 lyd_free_all(*result);
386 *result = NULL;
Radek Krejcie553e6d2019-06-07 15:33:18 +0200387 } else {
388 /* finish incompletely validated terminal values */
389 for (unsigned int u = 0; u < xmlctx.incomplete_type_validation.count; u++) {
390 struct lyd_node_term *node = (struct lyd_node_term*)xmlctx.incomplete_type_validation.objs[u];
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200391 const struct lyd_node **result_trees = NULL;
Radek Krejcie72c0432019-06-10 10:17:03 +0200392
393 /* prepare sized array for validator */
394 if (*result) {
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200395 result_trees = lyd_trees_new(1, *result);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200396 }
Radek Krejcie72c0432019-06-10 10:17:03 +0200397 /* validate and store the value of the node */
Radek Krejci3c9758d2019-07-11 16:49:10 +0200398 ret = lyd_value_parse(node, node->value.canonized, node->value.canonized ? strlen(node->value.canonized) : 0, 0, 1,
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200399 lydxml_resolve_prefix, ctx, LYD_XML, result_trees);
400 lyd_trees_free(result_trees, 0);
Radek Krejcie553e6d2019-06-07 15:33:18 +0200401 if (ret) {
402 lyd_free_all(*result);
403 *result = NULL;
404 break;
405 }
406 }
Radek Krejcif3b6fec2019-07-24 15:53:11 +0200407
408 if (!(*result)) {
409no_data:
410 /* no data */
411 if (options & (LYD_OPT_RPC | LYD_OPT_NOTIF)) {
412 /* error, top level node identify RPC and Notification */
413 LOGERR(ctx, LY_EINVAL, "Invalid input data of data parser - expected %s which cannot be empty.",
414 lyd_parse_options_type2str(options));
415 } else {
416 /* others - no work is needed, just check for missing mandatory nodes */
417 /* TODO lyd_validate(&result, options, ctx); */
418 }
419 }
Radek Krejcie92210c2019-05-17 15:53:35 +0200420 }
Radek Krejcie553e6d2019-06-07 15:33:18 +0200421
422 ly_set_erase(&xmlctx.incomplete_type_validation, NULL);
Radek Krejcie7b95092019-05-15 11:03:07 +0200423 lyxml_context_clear((struct lyxml_context*)&xmlctx);
424 return ret;
425}