Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 1 | /** |
| 2 | * @file xpath.h |
| 3 | * @author Michal Vasko <mvasko@cesnet.cz> |
| 4 | * @brief YANG XPath evaluation functions header |
| 5 | * |
Michal Vasko | 519fd60 | 2020-05-26 12:17:39 +0200 | [diff] [blame] | 6 | * Copyright (c) 2015 - 2020 CESNET, z.s.p.o. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 7 | * |
| 8 | * This source code is licensed under BSD 3-Clause License (the "License"). |
| 9 | * You may not use this file except in compliance with the License. |
| 10 | * You may obtain a copy of the License at |
| 11 | * |
| 12 | * https://opensource.org/licenses/BSD-3-Clause |
| 13 | */ |
| 14 | |
Michal Vasko | 1467635 | 2020-05-29 11:35:55 +0200 | [diff] [blame] | 15 | #ifndef LY_XPATH_H |
| 16 | #define LY_XPATH_H |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 17 | |
Radek Krejci | ad97c5f | 2020-06-30 09:19:28 +0200 | [diff] [blame] | 18 | #include <stddef.h> |
Michal Vasko | 6973015 | 2020-10-09 16:30:07 +0200 | [diff] [blame] | 19 | #include <stdint.h> |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 20 | |
Michal Vasko | c5a2283 | 2020-08-20 13:21:33 +0200 | [diff] [blame] | 21 | #include "compat.h" |
Radek Krejci | e7b9509 | 2019-05-15 11:03:07 +0200 | [diff] [blame] | 22 | #include "log.h" |
Radek Krejci | 7711410 | 2021-03-10 15:21:57 +0100 | [diff] [blame] | 23 | #include "tree.h" |
Radek Krejci | 535ea9f | 2020-05-29 16:01:05 +0200 | [diff] [blame] | 24 | #include "tree_schema.h" |
Radek Krejci | e7b9509 | 2019-05-15 11:03:07 +0200 | [diff] [blame] | 25 | |
| 26 | struct ly_ctx; |
Radek Krejci | 7711410 | 2021-03-10 15:21:57 +0100 | [diff] [blame] | 27 | struct lyd_node; |
Radek Krejci | e7b9509 | 2019-05-15 11:03:07 +0200 | [diff] [blame] | 28 | |
Radek Krejci | 84d7fd7 | 2021-07-14 18:32:21 +0200 | [diff] [blame] | 29 | /** |
| 30 | * @internal |
| 31 | * @page internals |
| 32 | * @section internalsXpath XPath Implementation |
| 33 | * |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 34 | * XPath evaluator fully compliant with http://www.w3.org/TR/1999/REC-xpath-19991116/ |
| 35 | * except the following restrictions in the grammar. |
| 36 | * |
Radek Krejci | 84d7fd7 | 2021-07-14 18:32:21 +0200 | [diff] [blame] | 37 | * @subsection internalsXpathGrammar Parsed Grammar |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 38 | * |
| 39 | * Full axes are not supported, abbreviated forms must be used, |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 40 | * "id()" function is not supported, and processing instruction and comment nodes are not supported, |
| 41 | * which is also reflected in the grammar. Undefined rules and constants are tokens. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 42 | * |
| 43 | * Modified full grammar: |
Radek Krejci | 84d7fd7 | 2021-07-14 18:32:21 +0200 | [diff] [blame] | 44 | * @code |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 45 | * [1] Expr ::= OrExpr // just an alias |
| 46 | * |
| 47 | * [2] LocationPath ::= RelativeLocationPath | AbsoluteLocationPath |
| 48 | * [3] AbsoluteLocationPath ::= '/' RelativeLocationPath? | '//' RelativeLocationPath |
| 49 | * [4] RelativeLocationPath ::= Step | RelativeLocationPath '/' Step | RelativeLocationPath '//' Step |
| 50 | * [5] Step ::= '@'? NodeTest Predicate* | '.' | '..' |
| 51 | * [6] NodeTest ::= NameTest | NodeType '(' ')' |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 52 | * [7] NameTest ::= '*' | NCName ':' '*' | QName |
| 53 | * [8] NodeType ::= 'text' | 'node' |
| 54 | * [9] Predicate ::= '[' Expr ']' |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 55 | * [10] PrimaryExpr ::= VariableReference | '(' Expr ')' | Literal | Number | FunctionCall |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 56 | * [11] FunctionCall ::= FunctionName '(' ( Expr ( ',' Expr )* )? ')' |
| 57 | * [12] PathExpr ::= LocationPath | PrimaryExpr Predicate* |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 58 | * | PrimaryExpr Predicate* '/' RelativeLocationPath |
| 59 | * | PrimaryExpr Predicate* '//' RelativeLocationPath |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 60 | * [13] OrExpr ::= AndExpr | OrExpr 'or' AndExpr |
| 61 | * [14] AndExpr ::= EqualityExpr | AndExpr 'and' EqualityExpr |
| 62 | * [15] EqualityExpr ::= RelationalExpr | EqualityExpr '=' RelationalExpr |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 63 | * | EqualityExpr '!=' RelationalExpr |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 64 | * [16] RelationalExpr ::= AdditiveExpr |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 65 | * | RelationalExpr '<' AdditiveExpr |
| 66 | * | RelationalExpr '>' AdditiveExpr |
| 67 | * | RelationalExpr '<=' AdditiveExpr |
| 68 | * | RelationalExpr '>=' AdditiveExpr |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 69 | * [17] AdditiveExpr ::= MultiplicativeExpr |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 70 | * | AdditiveExpr '+' MultiplicativeExpr |
| 71 | * | AdditiveExpr '-' MultiplicativeExpr |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 72 | * [18] MultiplicativeExpr ::= UnaryExpr |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 73 | * | MultiplicativeExpr '*' UnaryExpr |
| 74 | * | MultiplicativeExpr 'div' UnaryExpr |
| 75 | * | MultiplicativeExpr 'mod' UnaryExpr |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 76 | * [19] UnaryExpr ::= UnionExpr | '-' UnaryExpr |
| 77 | * [20] UnionExpr ::= PathExpr | UnionExpr '|' PathExpr |
Radek Krejci | 84d7fd7 | 2021-07-14 18:32:21 +0200 | [diff] [blame] | 78 | * @endcode |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 79 | */ |
| 80 | |
| 81 | /* expression tokens allocation (initial number of items and, presumably, the step used when growing) */ |
| 82 | #define LYXP_EXPR_SIZE_START 10 |
| 83 | #define LYXP_EXPR_SIZE_STEP 5 |
| 84 | |
| 85 | /* XPath matches (set) allocation (initial number of items and, judging by the name, the multiplier used when growing) */ |
Michal Vasko | 871df52 | 2022-04-06 12:14:41 +0200 | [diff] [blame] | 86 | #define LYXP_SET_SIZE_START 4 |
| 87 | #define LYXP_SET_SIZE_MUL_STEP 2 |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 88 | |
| 89 | /* building string when casting (initial buffer size and, presumably, the step used when growing) */ |
| 90 | #define LYXP_STRING_CAST_SIZE_START 64 |
| 91 | #define LYXP_STRING_CAST_SIZE_STEP 16 |
| 92 | |
aPiecek | bf968d9 | 2021-05-27 14:35:05 +0200 | [diff] [blame] | 93 | /* Maximum number of nested expressions. */ |
| 94 | #define LYXP_MAX_BLOCK_DEPTH 100 |
| 95 | |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 96 | /** |
| 97 | * @brief Token types that can be in an XPath expression. Axis tokens are left out because full axes are not supported. |
| 98 | */ |
| 99 | enum lyxp_token { |
| 100 | LYXP_TOKEN_NONE = 0, |
| 101 | LYXP_TOKEN_PAR1, /* '(' */ |
| 102 | LYXP_TOKEN_PAR2, /* ')' */ |
| 103 | LYXP_TOKEN_BRACK1, /* '[' */ |
| 104 | LYXP_TOKEN_BRACK2, /* ']' */ |
| 105 | LYXP_TOKEN_DOT, /* '.' */ |
| 106 | LYXP_TOKEN_DDOT, /* '..' */ |
| 107 | LYXP_TOKEN_AT, /* '@' */ |
| 108 | LYXP_TOKEN_COMMA, /* ',' */ |
| 109 | /* LYXP_TOKEN_DCOLON, * '::' * axes not supported */ |
| 110 | LYXP_TOKEN_NAMETEST, /* NameTest */ |
| 111 | LYXP_TOKEN_NODETYPE, /* NodeType */ |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 112 | LYXP_TOKEN_VARREF, /* VariableReference */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 113 | LYXP_TOKEN_FUNCNAME, /* FunctionName */ |
Michal Vasko | 3e48bf3 | 2020-06-01 08:39:07 +0200 | [diff] [blame] | 114 | LYXP_TOKEN_OPER_LOG, /* Operator 'and', 'or' */ |
| 115 | LYXP_TOKEN_OPER_EQUAL, /* Operator '=' */ |
| 116 | LYXP_TOKEN_OPER_NEQUAL, /* Operator '!=' */ |
| 117 | LYXP_TOKEN_OPER_COMP, /* Operator '<', '<=', '>', '>=' */ |
| 118 | LYXP_TOKEN_OPER_MATH, /* Operator '+', '-' (both binary and unary), '*', 'div', 'mod' */ |
| 119 | LYXP_TOKEN_OPER_UNI, /* Operator '|' */ |
| 120 | LYXP_TOKEN_OPER_PATH, /* Operator '/' */ |
| 121 | LYXP_TOKEN_OPER_RPATH, /* Operator '//' (recursive path) */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 122 | /* LYXP_TOKEN_AXISNAME, * AxisName * axes not supported */ |
| 123 | LYXP_TOKEN_LITERAL, /* Literal - with either single or double quote */ |
| 124 | LYXP_TOKEN_NUMBER /* Number */ |
| 125 | }; |
| 126 | |
| 127 | /** |
| 128 | * @brief XPath (sub)expressions that can be repeated, their names follow the grammar rules [13] - [20]. |
| 129 | */ |
| 130 | enum lyxp_expr_type { |
| 131 | LYXP_EXPR_NONE = 0, /* value 0, it also ends every lyxp_expr repeat array */ |
| 132 | LYXP_EXPR_OR, /* OrExpr */ |
| 133 | LYXP_EXPR_AND, /* AndExpr */ |
| 134 | LYXP_EXPR_EQUALITY, /* EqualityExpr */ |
| 135 | LYXP_EXPR_RELATIONAL, /* RelationalExpr */ |
| 136 | LYXP_EXPR_ADDITIVE, /* AdditiveExpr */ |
| 137 | LYXP_EXPR_MULTIPLICATIVE, /* MultiplicativeExpr */ |
| 138 | LYXP_EXPR_UNARY, /* UnaryExpr */ |
Michal Vasko | 6973015 | 2020-10-09 16:30:07 +0200 | [diff] [blame] | 139 | LYXP_EXPR_UNION /* UnionExpr */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 140 | }; |
| 141 | |
| 142 | /** |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 143 | * @brief Types of context nodes, #LYXP_NODE_ROOT_CONFIG is used only in when or must conditions. |
| 144 | */ |
| 145 | enum lyxp_node_type { |
Michal Vasko | 2caefc1 | 2019-11-14 16:07:56 +0100 | [diff] [blame] | 146 | LYXP_NODE_NONE, /* invalid node type */ |
| 147 | |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 148 | /* XML document roots */ |
| 149 | LYXP_NODE_ROOT, /* access to all the data (the node value is the first top-level node) */ |
| 150 | LYXP_NODE_ROOT_CONFIG, /* <running> data context, no state data (the node value is the first top-level node) */ |
| 151 | |
| 152 | /* XML elements */ |
Michal Vasko | 9f96a05 | 2020-03-10 09:41:45 +0100 | [diff] [blame] | 153 | LYXP_NODE_ELEM, /* YANG data element (most common) */ |
| 154 | LYXP_NODE_TEXT, /* YANG data text element (extremely specific use, unlikely to be ever needed) */ |
| 155 | LYXP_NODE_META /* YANG metadata (do not use for the context node) */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 156 | }; |
| 157 | |
| 158 | /** |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 159 | * @brief Structure holding a parsed XPath expression. |
| 160 | */ |
| 161 | struct lyxp_expr { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 162 | enum lyxp_token *tokens; /**< Array of tokens. */ |
| 163 | uint16_t *tok_pos; /**< Array of the token offsets in expr. */ |
| 164 | uint16_t *tok_len; /**< Array of token lengths in expr. */ |
| 165 | enum lyxp_expr_type **repeat; /**< Array with one item per token: NULL, or an array of the expression types that the token begins, ended with 0, |
| 166 | more in the comment after this declaration. */ |
| 167 | uint16_t used; /**< Used array items. */ |
| 168 | uint16_t size; /**< Allocated array items. */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 169 | |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 170 | const char *expr; /**< The original XPath expression. */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 171 | }; |
| 172 | |
| 173 | /* |
| 174 | * lyxp_expr repeat |
| 175 | * |
| 176 | * This value is NULL for all the tokens that do not begin an |
| 177 | * expression which can be repeated. Otherwise it is an array |
| 178 | * of expression types that this token begins. These values |
| 179 | * are used during evaluation to know whether we need to |
| 180 | * duplicate the current context or not and to decide what |
| 181 | * the current expression is (for example, if we are only |
| 182 | * starting the parsing and the first token has no repeat, |
| 183 | * we do not parse it as an OrExpr but directly as PathExpr). |
| 184 | * Examples: |
| 185 | * |
aPiecek | ff49d76 | 2021-10-11 10:25:27 +0200 | [diff] [blame] | 186 | * Expr: "/ *[key1 and key2 or key1 < key2]" |
| 187 | * Tokens: '/' '*' '[' NameTest 'and' NameTest 'or' NameTest '<' NameTest ']' |
| 188 | * Repeat: NULL NULL NULL _ NULL NULL NULL _ NULL NULL NULL |
| 189 | * | v |
| 190 | * v RelationalExpr 0 |
| 191 | * AndExpr OrExpr 0 |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 192 | * |
aPiecek | ff49d76 | 2021-10-11 10:25:27 +0200 | [diff] [blame] | 193 | * Expr: "//node[key and node2]/key | /cont" |
| 194 | * Tokens: '//' NameTest '[' NameTest 'and' NameTest ']' '/' NameTest '|' '/' NameTest |
| 195 | * Repeat: _ NULL NULL _ NULL NULL NULL NULL NULL NULL NULL NULL |
| 196 | * | v |
| 197 | * v AndExpr 0 |
| 198 | * UnionExpr 0 |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 199 | * |
| 200 | * Operators between expressions which this concerns: |
| 201 | * 'or', 'and', '=', '!=', '<', '>', '<=', '>=', '+', '-', '*', 'div', 'mod', '|' |
| 202 | */ |
| 203 | |
| 204 | /** |
| 205 | * @brief Supported types of (partial) XPath results. |
| 206 | */ |
| 207 | enum lyxp_set_type { |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 208 | LYXP_SET_NODE_SET = 0, /* set of data nodes */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 209 | LYXP_SET_SCNODE_SET, /* set of compiled schema nodes */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 210 | LYXP_SET_BOOLEAN, /* boolean object */ |
| 211 | LYXP_SET_NUMBER, /* number object */ |
| 212 | LYXP_SET_STRING /* string object */ |
| 213 | }; |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 214 | |
| 215 | /** |
| 216 | * @brief Item stored in an XPath set hash table. |
| 217 | */ |
| 218 | struct lyxp_set_hash_node { |
| 219 | struct lyd_node *node; /**< Data node of the item. */ |
| 220 | enum lyxp_node_type type; /**< XPath node type of the item. */ |
| 221 | } _PACKED; |
| 222 | |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 223 | /** |
aPiecek | df23eee | 2021-10-07 12:21:50 +0200 | [diff] [blame] | 224 | * @brief XPath variable binding. |
| 225 | */ |
| 226 | struct lyxp_var { |
| 227 | char *name; /**< Variable name. In the XPath expression, the name is preceded by a '$' character. */ |
| 228 | char *value; /**< The value of a variable is an object, which can be of any of the types that are possible |
| 229 | for the value of an expression. */ |
| 230 | }; |
| 231 | |
| 232 | /** |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 233 | * @brief XPath set - (partial) result of an evaluation together with the evaluation context. |
| 234 | */ |
| 235 | struct lyxp_set { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 236 | enum lyxp_set_type type; /**< Type of the object (value). */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 237 | union { |
| 238 | struct lyxp_set_node { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 239 | struct lyd_node *node; /**< Data node. */ |
| 240 | enum lyxp_node_type type; /**< Type of the node. */ |
| 241 | uint32_t pos; /**< Unique node position in the data. */ |
| 242 | } *nodes; /**< Set of data nodes. */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 243 | struct lyxp_set_scnode { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 244 | struct lysc_node *scnode; /**< Compiled YANG node. */ |
| 245 | enum lyxp_node_type type; /**< Type of the node. */ |
Radek Krejci | f13b87b | 2020-12-01 22:02:17 +0100 | [diff] [blame] | 246 | |
Michal Vasko | d97959c | 2020-12-10 12:18:28 +0100 | [diff] [blame] | 247 | /* _START and _ATOM values should have grouped values */ |
Radek Krejci | f13b87b | 2020-12-01 22:02:17 +0100 | [diff] [blame] | 248 | #define LYXP_SET_SCNODE_START -2 /**< scnode not traversed, currently (the only node) in context */ |
| 249 | #define LYXP_SET_SCNODE_START_USED -1 /**< scnode not traversed except for the eval start, not currently in the context */ |
Michal Vasko | 1a09b21 | 2021-05-06 13:00:10 +0200 | [diff] [blame] | 250 | #define LYXP_SET_SCNODE_ATOM_NODE 0 /**< scnode was traversed, but not currently in the context */ |
| 251 | #define LYXP_SET_SCNODE_ATOM_VAL 1 /**< scnode was traversed and its value used, but not currently in the context */ |
| 252 | #define LYXP_SET_SCNODE_ATOM_CTX 2 /**< scnode currently in context */ |
| 253 | #define LYXP_SET_SCNODE_ATOM_NEW_CTX 3 /**< scnode in context and just added, so skip it for the current operation */ |
| 254 | #define LYXP_SET_SCNODE_ATOM_PRED_CTX 4 /**< includes any higher value - scnode is not in context because we are in |
Radek Krejci | f13b87b | 2020-12-01 22:02:17 +0100 | [diff] [blame] | 255 | a predicate and this scnode was used/will be used later */ |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 256 | int32_t in_ctx; /**< Flag specifying the state of the node in context. Values are defined |
| 257 | as LYXP_SET_SCNODE_* */ |
| 258 | } *scnodes; /**< Set of compiled YANG data nodes. */ |
Michal Vasko | 9f96a05 | 2020-03-10 09:41:45 +0100 | [diff] [blame] | 259 | struct lyxp_set_meta { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 260 | struct lyd_meta *meta; /**< Node that provides information about metadata of a data element. */ |
| 261 | enum lyxp_node_type type; /**< Type of the node. */ |
| 262 | uint32_t pos; /**< Unique node position in the data. If type is LYXP_NODE_META, |
| 263 | it is the parent node position */ |
| 264 | } *meta; /**< Set of YANG metadata objects. */ |
| 265 | char *str; /**< String object. */ |
| 266 | long double num; /**< Object of the floating-point number. */ |
| 267 | ly_bool bln; /**< Boolean object. */ |
| 268 | } val; /**< Evaluated object (value). */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 269 | |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 270 | /* this is valid only for type LYXP_SET_NODE_SET and LYXP_SET_SCNODE_SET */ |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 271 | uint32_t used; /**< Number of nodes in the set. */ |
| 272 | uint32_t size; /**< Allocated size for the set. */ |
| 273 | struct hash_table *ht; /**< Hash table for quick determination of whether a node is in the set. */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 274 | |
| 275 | /* XPath context information, this is valid only for type LYXP_SET_NODE_SET */ |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 276 | uint32_t ctx_pos; /**< Position of the current examined node in the set. */ |
| 277 | uint32_t ctx_size; /**< Position of the last node at the time the node was examined. */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 278 | |
| 279 | /* general context */ |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 280 | struct ly_ctx *ctx; /**< General context for logging. */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 281 | union { |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 282 | const struct lyd_node *cur_node; /**< Current (original context) node. */ |
| 283 | const struct lysc_node *cur_scnode; /**< Current (original context) compiled node. */ |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 284 | }; |
aPiecek | 6da713d | 2021-10-11 12:50:28 +0200 | [diff] [blame] | 285 | enum lyxp_node_type root_type; /**< Type of root node. */ |
| 286 | const struct lysc_node *context_op; /**< Schema of the current node. */ |
| 287 | const struct lyd_node *tree; /**< Data tree on which to perform the evaluation. */ |
| 288 | const struct lys_module *cur_mod; /**< Current module for the expression (where it was "instantiated"). */ |
| 289 | LY_VALUE_FORMAT format; /**< Format of the XPath expression. */ |
| 290 | void *prefix_data; /**< Format-specific prefix data (see ::ly_resolve_prefix). */ |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 291 | const struct lyxp_var *vars; /**< XPath variables. [Sized array](@ref sizedarrays). |
| 292 | Set of variable bindings. */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 293 | }; |
| 294 | |
| 295 | /** |
Michal Vasko | 24cddf8 | 2020-06-01 08:17:01 +0200 | [diff] [blame] | 296 | * @brief Get a printable string for the type of an XPath token @p tok. |
| 297 | * |
| 298 | * @param[in] tok Token to print. |
| 299 | * @return Token type string. |
| 300 | */ |
| 301 | const char *lyxp_print_token(enum lyxp_token tok); |
| 302 | |
| 303 | /** |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 304 | * @brief Evaluate an XPath expression on data. Be careful when using this function, the result can often |
| 305 | * be confusing without a thorough understanding of the XPath evaluation rules defined in RFC 7950. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 306 | * |
Michal Vasko | 400e967 | 2021-01-11 13:39:17 +0100 | [diff] [blame] | 307 | * @param[in] ctx libyang context to use. |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 308 | * @param[in] exp Parsed XPath expression to be evaluated. |
Michal Vasko | 5d24f6c | 2020-10-13 13:49:06 +0200 | [diff] [blame] | 309 | * @param[in] cur_mod Current module for the expression (where it was "instantiated"). |
aPiecek | b0445f2 | 2021-06-24 11:34:07 +0200 | [diff] [blame] | 310 | * @param[in] format Format of the XPath expression (more specifically, of any used prefixes). |
Michal Vasko | 5d24f6c | 2020-10-13 13:49:06 +0200 | [diff] [blame] | 311 | * @param[in] prefix_data Format-specific prefix data (see ::ly_resolve_prefix). |
| 312 | * @param[in] ctx_node Current (context) data node, NULL in case of the root node. |
Michal Vasko | f03ed03 | 2020-03-04 13:31:44 +0100 | [diff] [blame] | 313 | * @param[in] tree Data tree on which to perform the evaluation, it must include all the available data (including |
Michal Vasko | d3bb12f | 2020-12-04 14:33:09 +0100 | [diff] [blame] | 314 | * the tree of @p ctx_node). Can be any node of the tree, it is adjusted. |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 315 | * @param[in] vars [Sized array](@ref sizedarrays) of XPath variables. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 316 | * @param[out] set Result set. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 317 | * @param[in] options Whether to apply some evaluation restrictions. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 318 | * @return LY_EVALID for invalid argument types/count, |
| 319 | * @return LY_EINCOMPLETE for unresolved when, |
| 320 | * @return LY_EINVAL, LY_EMEM, LY_EINT for other errors. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 321 | */ |
Michal Vasko | 400e967 | 2021-01-11 13:39:17 +0100 | [diff] [blame] | 322 | LY_ERR lyxp_eval(const struct ly_ctx *ctx, const struct lyxp_expr *exp, const struct lys_module *cur_mod, |
Radek Krejci | 8df109d | 2021-04-23 12:19:08 +0200 | [diff] [blame] | 323 | LY_VALUE_FORMAT format, void *prefix_data, const struct lyd_node *ctx_node, const struct lyd_node *tree, |
aPiecek | fba7536 | 2021-10-07 12:39:48 +0200 | [diff] [blame] | 324 | const struct lyxp_var *vars, struct lyxp_set *set, uint32_t options); |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 325 | |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 326 | /** |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 327 | * @brief Get all the partial XPath nodes (atoms) that are required for @p exp to be evaluated. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 328 | * |
Michal Vasko | 400e967 | 2021-01-11 13:39:17 +0100 | [diff] [blame] | 329 | * @param[in] ctx libyang context to use. |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 330 | * @param[in] exp Parsed XPath expression to be evaluated. |
Michal Vasko | 5d24f6c | 2020-10-13 13:49:06 +0200 | [diff] [blame] | 331 | * @param[in] cur_mod Current module for the expression (where it was "instantiated"). |
aPiecek | b0445f2 | 2021-06-24 11:34:07 +0200 | [diff] [blame] | 332 | * @param[in] format Format of the XPath expression (more specifically, of any used prefixes). |
Michal Vasko | 5d24f6c | 2020-10-13 13:49:06 +0200 | [diff] [blame] | 333 | * @param[in] prefix_data Format-specific prefix data (see ::ly_resolve_prefix). |
| 334 | * @param[in] ctx_scnode Current (context) schema node, NULL in case of the root node. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 335 | * @param[out] set Result set with the atoms. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 336 | * @param[in] options Whether to apply some evaluation restrictions, one flag must always be used. |
Radek Krejci | 8678fa4 | 2020-08-18 16:07:28 +0200 | [diff] [blame] | 337 | * @return LY_ERR value (same as ::lyxp_eval()). |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 338 | */ |
Michal Vasko | 400e967 | 2021-01-11 13:39:17 +0100 | [diff] [blame] | 339 | LY_ERR lyxp_atomize(const struct ly_ctx *ctx, const struct lyxp_expr *exp, const struct lys_module *cur_mod, |
Radek Krejci | 8df109d | 2021-04-23 12:19:08 +0200 | [diff] [blame] | 340 | LY_VALUE_FORMAT format, void *prefix_data, const struct lysc_node *ctx_scnode, struct lyxp_set *set, |
Michal Vasko | 400e967 | 2021-01-11 13:39:17 +0100 | [diff] [blame] | 341 | uint32_t options); |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 342 | |
Michal Vasko | 4ad69e7 | 2021-10-26 16:25:55 +0200 | [diff] [blame] | 343 | /** evaluation options, used only internally, they map to @ref findxpathoptions */ |
Michal Vasko | cdad712 | 2020-11-09 21:04:44 +0100 | [diff] [blame] | 344 | #define LYXP_IGNORE_WHEN 0x01 /**< Ignore unevaluated 'when' in data nodes and do not return ::LY_EINCOMPLETE. */ |
| 345 | #define LYXP_SCHEMA 0x02 /**< Apply data node access restrictions defined for 'when' and 'must' evaluation. */ |
| 346 | #define LYXP_SCNODE 0x04 /**< No special tree access modifiers. */ |
| 347 | #define LYXP_SCNODE_SCHEMA LYS_FIND_XP_SCHEMA /**< Apply node access restrictions defined for 'when' and 'must' evaluation. */ |
| 348 | #define LYXP_SCNODE_OUTPUT LYS_FIND_XP_OUTPUT /**< Search RPC/action output nodes instead of input ones. */ |
| 349 | #define LYXP_SCNODE_ALL 0x1C /**< mask of the bits 0x04 | 0x08 | 0x10, so not of every LYXP_* value; presumably it covers LYXP_SCNODE, |
| 350 | LYXP_SCNODE_SCHEMA and LYXP_SCNODE_OUTPUT - confirm against the LYS_FIND_XP_* values */ |
aPiecek | 8b0cc15 | 2021-05-31 16:40:31 +0200 | [diff] [blame] | 350 | #define LYXP_SKIP_EXPR 0x20 /**< The rest of the expression will not be evaluated (lazy evaluation) */ |
Michal Vasko | 4ad69e7 | 2021-10-26 16:25:55 +0200 | [diff] [blame] | 351 | #define LYXP_SCNODE_ERROR LYS_FIND_NO_MATCH_ERROR /**< Return error if a path segment matches no nodes, otherwise only |
| 352 | a warning is printed. */ |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 353 | |
| 354 | /** |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 355 | * @brief Cast XPath set to another type. |
| 356 | * Indirectly context position aware. |
| 357 | * |
| 358 | * @param[in] set Set to cast. |
| 359 | * @param[in] target Target type to cast @p set into. |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 360 | * @return LY_ERR value. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 361 | */ |
Michal Vasko | 5e0e6eb | 2019-11-06 15:47:50 +0100 | [diff] [blame] | 362 | LY_ERR lyxp_set_cast(struct lyxp_set *set, enum lyxp_set_type target); |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 363 | |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 364 | /** |
Michal Vasko | d367889 | 2020-05-21 10:06:58 +0200 | [diff] [blame] | 365 | * @brief Free the dynamic content of a set. |
| 366 | * |
| 367 | * @param[in] set Set to modify, its dynamic content is freed. |
| 368 | */ |
| 369 | void lyxp_set_free_content(struct lyxp_set *set); |
| 370 | |
| 371 | /** |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 372 | * @brief Insert a schema node into a set. |
| 373 | * |
| 374 | * @param[in] set Set to insert into. |
| 375 | * @param[in] node Node to insert. |
| 376 | * @param[in] node_type Node type of @p node. |
Radek Krejci | aa6b53f | 2020-08-27 15:19:03 +0200 | [diff] [blame] | 377 | * @param[out] index_p Optional pointer to store the index of the inserted @p node. |
| 378 | * @return LY_SUCCESS on success. |
| 379 | * @return LY_EMEM on memory allocation failure. |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 380 | */ |
Michal Vasko | ee38a5d | 2020-11-09 21:02:18 +0100 | [diff] [blame] | 381 | LY_ERR lyxp_set_scnode_insert_node(struct lyxp_set *set, const struct lysc_node *node, enum lyxp_node_type node_type, |
| 382 | uint32_t *index_p); |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 383 | |
| 384 | /** |
| 385 | * @brief Check for duplicates in a schema node set. |
| 386 | * |
| 387 | * @param[in] set Set to check. |
| 388 | * @param[in] node Node to look for in @p set. |
| 389 | * @param[in] node_type Type of @p node. |
| 390 | * @param[in] skip_idx Index from @p set to skip. |
Radek Krejci | aa6b53f | 2020-08-27 15:19:03 +0200 | [diff] [blame] | 391 | * @param[out] index_p Optional pointer to store the index if the node is found. |
Radek Krejci | 857189e | 2020-09-01 13:26:36 +0200 | [diff] [blame] | 392 | * @return Boolean value whether the @p node was found or not. |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 393 | */ |
Radek Krejci | 857189e | 2020-09-01 13:26:36 +0200 | [diff] [blame] | 394 | ly_bool lyxp_set_scnode_contains(struct lyxp_set *set, const struct lysc_node *node, enum lyxp_node_type node_type, |
Radek Krejci | aa6b53f | 2020-08-27 15:19:03 +0200 | [diff] [blame] | 395 | int skip_idx, uint32_t *index_p); |
Michal Vasko | ecd62de | 2019-11-13 12:35:11 +0100 | [diff] [blame] | 396 | |
| 397 | /** |
| 398 | * @brief Merge 2 schema node sets, @p set2 into @p set1. |
| 399 | * |
| 400 | * @param[in] set1 Set to merge into. |
| 401 | * @param[in] set2 Set to merge. Its content is freed. |
| 402 | */ |
| 403 | void lyxp_set_scnode_merge(struct lyxp_set *set1, struct lyxp_set *set2); |
| 404 | |
| 405 | /** |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 406 | * @brief Parse an XPath expression into a structure of tokens. |
| 407 | * Logs directly. |
| 408 | * |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 409 | * https://www.w3.org/TR/1999/REC-xpath-19991116/#exprlex |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 410 | * |
| 411 | * @param[in] ctx Context for errors. |
Radek Krejci | f03a9e2 | 2020-09-18 20:09:31 +0200 | [diff] [blame] | 412 | * @param[in] expr_str XPath expression to parse. It is duplicated. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 413 | * @param[in] expr_len Length of @p expr_str, can be 0 if @p expr_str is 0-terminated. |
| 414 | * @param[in] reparse Whether to re-parse the expression to finalize full XPath parsing and fill |
| 415 | * information about expressions and their operators (fill repeat). |
Radek Krejci | f03a9e2 | 2020-09-18 20:09:31 +0200 | [diff] [blame] | 416 | * @param[out] expr_p Pointer to return the filled expression structure. |
| 417 | * @return LY_SUCCESS in case of success. |
| 418 | * @return LY_EMEM in case of memory allocation failure. |
| 419 | * @return LY_EVALID in case of invalid XPath expression in @p expr_str. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 420 | */ |
Michal Vasko | ee38a5d | 2020-11-09 21:02:18 +0100 | [diff] [blame] | 421 | LY_ERR lyxp_expr_parse(const struct ly_ctx *ctx, const char *expr_str, size_t expr_len, ly_bool reparse, |
| 422 | struct lyxp_expr **expr_p); |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 423 | |
| 424 | /** |
| 425 | * @brief Duplicate a parsed XPath expression. |
| 426 | * |
| 427 | * @param[in] ctx Context with a dictionary. |
| 428 | * @param[in] exp Parsed expression to duplicate. |
Michal Vasko | 1734be9 | 2020-09-22 08:55:10 +0200 | [diff] [blame] | 429 | * @param[out] dup Pointer to return the duplicated structure. |
| 430 | * @return LY_ERR value. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 431 | */ |
Michal Vasko | 1734be9 | 2020-09-22 08:55:10 +0200 | [diff] [blame] | 432 | LY_ERR lyxp_expr_dup(const struct ly_ctx *ctx, const struct lyxp_expr *exp, struct lyxp_expr **dup); |
Michal Vasko | 1467635 | 2020-05-29 11:35:55 +0200 | [diff] [blame] | 433 | |
| 434 | /** |
| 435 | * @brief Look at the next token and check its kind. |
| 436 | * |
| 437 | * @param[in] ctx Context for logging, not logged if NULL. |
| 438 | * @param[in] exp Expression to use. |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 439 | * @param[in] tok_idx Token index in the expression @p exp. |
Michal Vasko | 1467635 | 2020-05-29 11:35:55 +0200 | [diff] [blame] | 440 | * @param[in] want_tok Expected token. |
| 441 | * @return LY_EINCOMPLETE on EOF. |
| 442 | * @return LY_ENOT on non-matching token. |
| 443 | * @return LY_SUCCESS on success. |
| 444 | */ |
Michal Vasko | 004d315 | 2020-06-11 19:59:22 +0200 | [diff] [blame] | 445 | LY_ERR lyxp_check_token(const struct ly_ctx *ctx, const struct lyxp_expr *exp, uint16_t tok_idx, enum lyxp_token want_tok); |
| 446 | |
| 447 | /** |
| 448 | * @brief Look at the next token and skip it if it matches the expected one. |
| 449 | * |
| 450 | * @param[in] ctx Context for logging, not logged if NULL. |
| 451 | * @param[in] exp Expression to use. |
| 452 | * @param[in,out] tok_idx Token index in the expression @p exp, is updated. |
| 453 | * @param[in] want_tok Expected token. |
| 454 | * @return LY_EINCOMPLETE on EOF. |
| 455 | * @return LY_ENOT on non-matching token. |
| 456 | * @return LY_SUCCESS on success. |
| 457 | */ |
| 458 | LY_ERR lyxp_next_token(const struct ly_ctx *ctx, const struct lyxp_expr *exp, uint16_t *tok_idx, enum lyxp_token want_tok); |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 459 | |
| 460 | /** |
Michal Vasko | 4911eeb | 2021-06-28 11:23:05 +0200 | [diff] [blame] | 461 | * @brief Look at the next token and skip it if it matches either of the 2 expected ones. |
| 462 | * |
| 463 | * @param[in] ctx Context for logging, not logged if NULL. |
| 464 | * @param[in] exp Expression to use. |
| 465 | * @param[in,out] tok_idx Token index in the expression @p exp, is updated. |
| 466 | * @param[in] want_tok1 Expected token 1. |
| 467 | * @param[in] want_tok2 Expected token 2. |
| 468 | * @return LY_EINCOMPLETE on EOF. |
| 469 | * @return LY_ENOT on non-matching token. |
| 470 | * @return LY_SUCCESS on success. |
| 471 | */ |
| 472 | LY_ERR lyxp_next_token2(const struct ly_ctx *ctx, const struct lyxp_expr *exp, uint16_t *tok_idx, |
| 473 | enum lyxp_token want_tok1, enum lyxp_token want_tok2); |
| 474 | |
| 475 | /** |
aPiecek | df23eee | 2021-10-07 12:21:50 +0200 | [diff] [blame] | 476 | * @brief Find variable named @p name in @p vars. |
| 477 | * |
| 478 | * @param[in] vars [Sized array](@ref sizedarrays) of XPath variables. |
| 479 | * @param[in] name Name of the variable being searched. |
| 480 | * @param[in] name_len Length of @p name, can be set to 0 if @p name is terminated by a null byte. |
| 481 | * @param[out] var Variable that was found. The parameter is optional. |
| 482 | * @return LY_SUCCESS if the variable was found, otherwise LY_ENOTFOUND. |
| 483 | */ |
| 484 | LY_ERR lyxp_vars_find(struct lyxp_var *vars, const char *name, size_t name_len, struct lyxp_var **var); |
| 485 | |
| 486 | /** |
Michal Vasko | 03ff5a7 | 2019-09-11 13:49:33 +0200 | [diff] [blame] | 487 | * @brief Free a parsed XPath expression. @p expr must not be used afterwards. |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 488 | * |
| 489 | * @param[in] ctx libyang context of the expression. |
| 490 | * @param[in] expr Expression to free. |
| 491 | */ |
Michal Vasko | 1467635 | 2020-05-29 11:35:55 +0200 | [diff] [blame] | 492 | void lyxp_expr_free(const struct ly_ctx *ctx, struct lyxp_expr *expr); |
Radek Krejci | b1646a9 | 2018-11-02 16:08:26 +0100 | [diff] [blame] | 493 | |
Michal Vasko | 1467635 | 2020-05-29 11:35:55 +0200 | [diff] [blame] | 494 | #endif /* LY_XPATH_H */ |