1 | /*------------------------------------------------------------------------- |
2 | * |
3 | * jsonfuncs.c |
4 | * Functions to process JSON data types. |
5 | * |
6 | * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group |
7 | * Portions Copyright (c) 1994, Regents of the University of California |
8 | * |
9 | * IDENTIFICATION |
10 | * src/backend/utils/adt/jsonfuncs.c |
11 | * |
12 | *------------------------------------------------------------------------- |
13 | */ |
14 | |
15 | #include "postgres.h" |
16 | |
17 | #include <limits.h> |
18 | |
19 | #include "access/htup_details.h" |
20 | #include "catalog/pg_type.h" |
21 | #include "fmgr.h" |
22 | #include "funcapi.h" |
23 | #include "lib/stringinfo.h" |
24 | #include "mb/pg_wchar.h" |
25 | #include "miscadmin.h" |
26 | #include "utils/array.h" |
27 | #include "utils/builtins.h" |
28 | #include "utils/hsearch.h" |
29 | #include "utils/json.h" |
30 | #include "utils/jsonapi.h" |
31 | #include "utils/jsonb.h" |
32 | #include "utils/lsyscache.h" |
33 | #include "utils/memutils.h" |
34 | #include "utils/syscache.h" |
35 | #include "utils/typcache.h" |
36 | |
/*
 * Operation flags understood by setPath().  Every flag owns a distinct bit,
 * so several of them can be OR-ed together into a single op_type value.
 */
#define JB_PATH_CREATE			(1 << 0)
#define JB_PATH_DELETE			(1 << 1)
#define JB_PATH_REPLACE			(1 << 2)
#define JB_PATH_INSERT_BEFORE	(1 << 3)
#define JB_PATH_INSERT_AFTER	(1 << 4)

/* any operation that may add a new element */
#define JB_PATH_CREATE_OR_INSERT \
	(JB_PATH_CREATE | JB_PATH_INSERT_BEFORE | JB_PATH_INSERT_AFTER)
45 | |
46 | /* state for json_object_keys */ |
47 | typedef struct OkeysState |
48 | { |
49 | JsonLexContext *lex; |
50 | char **result; |
51 | int result_size; |
52 | int result_count; |
53 | int sent_count; |
54 | } OkeysState; |
55 | |
56 | /* state for iterate_json_values function */ |
57 | typedef struct IterateJsonStringValuesState |
58 | { |
59 | JsonLexContext *lex; |
60 | JsonIterateStringValuesAction action; /* an action that will be applied |
61 | * to each json value */ |
62 | void *action_state; /* any necessary context for iteration */ |
63 | uint32 flags; /* what kind of elements from a json we want |
64 | * to iterate */ |
65 | } IterateJsonStringValuesState; |
66 | |
67 | /* state for transform_json_string_values function */ |
68 | typedef struct TransformJsonStringValuesState |
69 | { |
70 | JsonLexContext *lex; |
71 | StringInfo strval; /* resulting json */ |
72 | JsonTransformStringValuesAction action; /* an action that will be applied |
73 | * to each json value */ |
74 | void *action_state; /* any necessary context for transformation */ |
75 | } TransformJsonStringValuesState; |
76 | |
77 | /* state for json_get* functions */ |
78 | typedef struct GetState |
79 | { |
80 | JsonLexContext *lex; |
81 | text *tresult; |
82 | char *result_start; |
83 | bool normalize_results; |
84 | bool next_scalar; |
85 | int npath; /* length of each path-related array */ |
86 | char **path_names; /* field name(s) being sought */ |
87 | int *path_indexes; /* array index(es) being sought */ |
88 | bool *pathok; /* is path matched to current depth? */ |
89 | int *array_cur_index; /* current element index at each path |
90 | * level */ |
91 | } GetState; |
92 | |
93 | /* state for json_array_length */ |
94 | typedef struct AlenState |
95 | { |
96 | JsonLexContext *lex; |
97 | int count; |
98 | } AlenState; |
99 | |
100 | /* state for json_each */ |
101 | typedef struct EachState |
102 | { |
103 | JsonLexContext *lex; |
104 | Tuplestorestate *tuple_store; |
105 | TupleDesc ret_tdesc; |
106 | MemoryContext tmp_cxt; |
107 | char *result_start; |
108 | bool normalize_results; |
109 | bool next_scalar; |
110 | char *normalized_scalar; |
111 | } EachState; |
112 | |
113 | /* state for json_array_elements */ |
114 | typedef struct ElementsState |
115 | { |
116 | JsonLexContext *lex; |
117 | const char *function_name; |
118 | Tuplestorestate *tuple_store; |
119 | TupleDesc ret_tdesc; |
120 | MemoryContext tmp_cxt; |
121 | char *result_start; |
122 | bool normalize_results; |
123 | bool next_scalar; |
124 | char *normalized_scalar; |
125 | } ElementsState; |
126 | |
127 | /* state for get_json_object_as_hash */ |
128 | typedef struct JHashState |
129 | { |
130 | JsonLexContext *lex; |
131 | const char *function_name; |
132 | HTAB *hash; |
133 | char *saved_scalar; |
134 | char *save_json_start; |
135 | JsonTokenType saved_token_type; |
136 | } JHashState; |
137 | |
138 | /* hashtable element */ |
139 | typedef struct JsonHashEntry |
140 | { |
141 | char fname[NAMEDATALEN]; /* hash key (MUST BE FIRST) */ |
142 | char *val; |
143 | JsonTokenType type; |
144 | } JsonHashEntry; |
145 | |
146 | /* structure to cache type I/O metadata needed for populate_scalar() */ |
147 | typedef struct ScalarIOData |
148 | { |
149 | Oid typioparam; |
150 | FmgrInfo typiofunc; |
151 | } ScalarIOData; |
152 | |
/*
 * ColumnIOData and RecordIOData are used recursively (the per-category cache
 * structs below point at them), so their tags are declared up front.
 */
typedef struct ColumnIOData ColumnIOData;
typedef struct RecordIOData RecordIOData;
156 | |
157 | /* structure to cache metadata needed for populate_array() */ |
158 | typedef struct ArrayIOData |
159 | { |
160 | ColumnIOData *element_info; /* metadata cache */ |
161 | Oid element_type; /* array element type id */ |
162 | int32 element_typmod; /* array element type modifier */ |
163 | } ArrayIOData; |
164 | |
165 | /* structure to cache metadata needed for populate_composite() */ |
166 | typedef struct CompositeIOData |
167 | { |
168 | /* |
169 | * We use pointer to a RecordIOData here because variable-length struct |
170 | * RecordIOData can't be used directly in ColumnIOData.io union |
171 | */ |
172 | RecordIOData *record_io; /* metadata cache for populate_record() */ |
173 | TupleDesc tupdesc; /* cached tuple descriptor */ |
174 | /* these fields differ from target type only if domain over composite: */ |
175 | Oid base_typid; /* base type id */ |
176 | int32 base_typmod; /* base type modifier */ |
177 | /* this field is used only if target type is domain over composite: */ |
178 | void *domain_info; /* opaque cache for domain checks */ |
179 | } CompositeIOData; |
180 | |
181 | /* structure to cache metadata needed for populate_domain() */ |
182 | typedef struct DomainIOData |
183 | { |
184 | ColumnIOData *base_io; /* metadata cache */ |
185 | Oid base_typid; /* base type id */ |
186 | int32 base_typmod; /* base type modifier */ |
187 | void *domain_info; /* opaque cache for domain checks */ |
188 | } DomainIOData; |
189 | |
/*
 * Categories a column type can belong to.  Each enumerator is given an
 * explicit character code.
 */
typedef enum TypeCat
{
	TYPECAT_SCALAR = 's',
	TYPECAT_ARRAY = 'a',
	TYPECAT_COMPOSITE = 'c',
	TYPECAT_COMPOSITE_DOMAIN = 'C',
	TYPECAT_DOMAIN = 'd'
} TypeCat;
199 | |
200 | /* these two are stolen from hstore / record_out, used in populate_record* */ |
201 | |
202 | /* structure to cache record metadata needed for populate_record_field() */ |
203 | struct ColumnIOData |
204 | { |
205 | Oid typid; /* column type id */ |
206 | int32 typmod; /* column type modifier */ |
207 | TypeCat typcat; /* column type category */ |
208 | ScalarIOData scalar_io; /* metadata cache for directi conversion |
209 | * through input function */ |
210 | union |
211 | { |
212 | ArrayIOData array; |
213 | CompositeIOData composite; |
214 | DomainIOData domain; |
215 | } io; /* metadata cache for various column type |
216 | * categories */ |
217 | }; |
218 | |
219 | /* structure to cache record metadata needed for populate_record() */ |
220 | struct RecordIOData |
221 | { |
222 | Oid record_type; |
223 | int32 record_typmod; |
224 | int ncolumns; |
225 | ColumnIOData columns[FLEXIBLE_ARRAY_MEMBER]; |
226 | }; |
227 | |
228 | /* per-query cache for populate_record_worker and populate_recordset_worker */ |
229 | typedef struct PopulateRecordCache |
230 | { |
231 | Oid argtype; /* declared type of the record argument */ |
232 | ColumnIOData c; /* metadata cache for populate_composite() */ |
233 | MemoryContext fn_mcxt; /* where this is stored */ |
234 | } PopulateRecordCache; |
235 | |
236 | /* per-call state for populate_recordset */ |
237 | typedef struct PopulateRecordsetState |
238 | { |
239 | JsonLexContext *lex; |
240 | const char *function_name; |
241 | HTAB *json_hash; |
242 | char *saved_scalar; |
243 | char *save_json_start; |
244 | JsonTokenType saved_token_type; |
245 | Tuplestorestate *tuple_store; |
246 | HeapTupleHeader rec; |
247 | PopulateRecordCache *cache; |
248 | } PopulateRecordsetState; |
249 | |
250 | /* common data for populate_array_json() and populate_array_dim_jsonb() */ |
251 | typedef struct PopulateArrayContext |
252 | { |
253 | ArrayBuildState *astate; /* array build state */ |
254 | ArrayIOData *aio; /* metadata cache */ |
255 | MemoryContext acxt; /* array build memory context */ |
256 | MemoryContext mcxt; /* cache memory context */ |
257 | const char *colname; /* for diagnostics only */ |
258 | int *dims; /* dimensions */ |
259 | int *sizes; /* current dimension counters */ |
260 | int ndims; /* number of dimensions */ |
261 | } PopulateArrayContext; |
262 | |
263 | /* state for populate_array_json() */ |
264 | typedef struct PopulateArrayState |
265 | { |
266 | JsonLexContext *lex; /* json lexer */ |
267 | PopulateArrayContext *ctx; /* context */ |
268 | char *element_start; /* start of the current array element */ |
269 | char *element_scalar; /* current array element token if it is a |
270 | * scalar */ |
271 | JsonTokenType element_type; /* current array element type */ |
272 | } PopulateArrayState; |
273 | |
274 | /* state for json_strip_nulls */ |
275 | typedef struct StripnullState |
276 | { |
277 | JsonLexContext *lex; |
278 | StringInfo strval; |
279 | bool skip_next_null; |
280 | } StripnullState; |
281 | |
282 | /* structure for generalized json/jsonb value passing */ |
283 | typedef struct JsValue |
284 | { |
285 | bool is_json; /* json/jsonb */ |
286 | union |
287 | { |
288 | struct |
289 | { |
290 | char *str; /* json string */ |
291 | int len; /* json string length or -1 if null-terminated */ |
292 | JsonTokenType type; /* json type */ |
293 | } json; /* json value */ |
294 | |
295 | JsonbValue *jsonb; /* jsonb value */ |
296 | } val; |
297 | } JsValue; |
298 | |
299 | typedef struct JsObject |
300 | { |
301 | bool is_json; /* json/jsonb */ |
302 | union |
303 | { |
304 | HTAB *json_hash; |
305 | JsonbContainer *jsonb_cont; |
306 | } val; |
307 | } JsObject; |
308 | |
/*
 * Helper macros for inspecting JsValue / JsObject.  Being macros, they
 * evaluate their argument more than once.
 */

/* is the value missing, or a json/jsonb null? */
#define JsValueIsNull(jsv) \
	((jsv)->is_json \
	 ? ((jsv)->val.json.str == NULL || \
		(jsv)->val.json.type == JSON_TOKEN_NULL) \
	 : ((jsv)->val.jsonb == NULL || \
		(jsv)->val.jsonb->type == jbvNull))

/* is the value a json/jsonb string? */
#define JsValueIsString(jsv) \
	((jsv)->is_json \
	 ? ((jsv)->val.json.type == JSON_TOKEN_STRING) \
	 : ((jsv)->val.jsonb != NULL && \
		(jsv)->val.jsonb->type == jbvString))

/* does the object have no entries (a NULL jsonb container counts as empty)? */
#define JsObjectIsEmpty(jso) \
	((jso)->is_json \
	 ? (hash_get_num_entries((jso)->val.json_hash) == 0) \
	 : ((jso)->val.jsonb_cont == NULL || \
		JsonContainerSize((jso)->val.jsonb_cont) == 0))

/* destroy the hash table of a json object; does nothing for jsonb */
#define JsObjectFree(jso) \
	do \
	{ \
		if ((jso)->is_json) \
			hash_destroy((jso)->val.json_hash); \
	} while (0)
330 | |
331 | /* semantic action functions for json_object_keys */ |
332 | static void okeys_object_field_start(void *state, char *fname, bool isnull); |
333 | static void okeys_array_start(void *state); |
334 | static void okeys_scalar(void *state, char *token, JsonTokenType tokentype); |
335 | |
336 | /* semantic action functions for json_get* functions */ |
337 | static void get_object_start(void *state); |
338 | static void get_object_end(void *state); |
339 | static void get_object_field_start(void *state, char *fname, bool isnull); |
340 | static void get_object_field_end(void *state, char *fname, bool isnull); |
341 | static void get_array_start(void *state); |
342 | static void get_array_end(void *state); |
343 | static void get_array_element_start(void *state, bool isnull); |
344 | static void get_array_element_end(void *state, bool isnull); |
345 | static void get_scalar(void *state, char *token, JsonTokenType tokentype); |
346 | |
347 | /* common worker function for json getter functions */ |
348 | static Datum get_path_all(FunctionCallInfo fcinfo, bool as_text); |
349 | static text *get_worker(text *json, char **tpath, int *ipath, int npath, |
350 | bool normalize_results); |
351 | static Datum get_jsonb_path_all(FunctionCallInfo fcinfo, bool as_text); |
352 | |
353 | /* semantic action functions for json_array_length */ |
354 | static void alen_object_start(void *state); |
355 | static void alen_scalar(void *state, char *token, JsonTokenType tokentype); |
356 | static void alen_array_element_start(void *state, bool isnull); |
357 | |
358 | /* common workers for json{b}_each* functions */ |
359 | static Datum each_worker(FunctionCallInfo fcinfo, bool as_text); |
360 | static Datum each_worker_jsonb(FunctionCallInfo fcinfo, const char *funcname, |
361 | bool as_text); |
362 | |
363 | /* semantic action functions for json_each */ |
364 | static void each_object_field_start(void *state, char *fname, bool isnull); |
365 | static void each_object_field_end(void *state, char *fname, bool isnull); |
366 | static void each_array_start(void *state); |
367 | static void each_scalar(void *state, char *token, JsonTokenType tokentype); |
368 | |
369 | /* common workers for json{b}_array_elements_* functions */ |
370 | static Datum elements_worker(FunctionCallInfo fcinfo, const char *funcname, |
371 | bool as_text); |
372 | static Datum elements_worker_jsonb(FunctionCallInfo fcinfo, const char *funcname, |
373 | bool as_text); |
374 | |
375 | /* semantic action functions for json_array_elements */ |
376 | static void elements_object_start(void *state); |
377 | static void elements_array_element_start(void *state, bool isnull); |
378 | static void elements_array_element_end(void *state, bool isnull); |
379 | static void elements_scalar(void *state, char *token, JsonTokenType tokentype); |
380 | |
381 | /* turn a json object into a hash table */ |
382 | static HTAB *get_json_object_as_hash(char *json, int len, const char *funcname); |
383 | |
384 | /* semantic actions for populate_array_json */ |
385 | static void populate_array_object_start(void *_state); |
386 | static void populate_array_array_end(void *_state); |
387 | static void populate_array_element_start(void *_state, bool isnull); |
388 | static void populate_array_element_end(void *_state, bool isnull); |
389 | static void populate_array_scalar(void *_state, char *token, JsonTokenType tokentype); |
390 | |
391 | /* semantic action functions for get_json_object_as_hash */ |
392 | static void hash_object_field_start(void *state, char *fname, bool isnull); |
393 | static void hash_object_field_end(void *state, char *fname, bool isnull); |
394 | static void hash_array_start(void *state); |
395 | static void hash_scalar(void *state, char *token, JsonTokenType tokentype); |
396 | |
397 | /* semantic action functions for populate_recordset */ |
398 | static void populate_recordset_object_field_start(void *state, char *fname, bool isnull); |
399 | static void populate_recordset_object_field_end(void *state, char *fname, bool isnull); |
400 | static void populate_recordset_scalar(void *state, char *token, JsonTokenType tokentype); |
401 | static void populate_recordset_object_start(void *state); |
402 | static void populate_recordset_object_end(void *state); |
403 | static void populate_recordset_array_start(void *state); |
404 | static void populate_recordset_array_element_start(void *state, bool isnull); |
405 | |
406 | /* semantic action functions for json_strip_nulls */ |
407 | static void sn_object_start(void *state); |
408 | static void sn_object_end(void *state); |
409 | static void sn_array_start(void *state); |
410 | static void sn_array_end(void *state); |
411 | static void sn_object_field_start(void *state, char *fname, bool isnull); |
412 | static void sn_array_element_start(void *state, bool isnull); |
413 | static void sn_scalar(void *state, char *token, JsonTokenType tokentype); |
414 | |
415 | /* worker functions for populate_record, to_record, populate_recordset and to_recordset */ |
416 | static Datum populate_recordset_worker(FunctionCallInfo fcinfo, const char *funcname, |
417 | bool is_json, bool have_record_arg); |
418 | static Datum populate_record_worker(FunctionCallInfo fcinfo, const char *funcname, |
419 | bool is_json, bool have_record_arg); |
420 | |
421 | /* helper functions for populate_record[set] */ |
422 | static HeapTupleHeader populate_record(TupleDesc tupdesc, RecordIOData **record_p, |
423 | HeapTupleHeader defaultval, MemoryContext mcxt, |
424 | JsObject *obj); |
425 | static void get_record_type_from_argument(FunctionCallInfo fcinfo, |
426 | const char *funcname, |
427 | PopulateRecordCache *cache); |
428 | static void get_record_type_from_query(FunctionCallInfo fcinfo, |
429 | const char *funcname, |
430 | PopulateRecordCache *cache); |
431 | static void JsValueToJsObject(JsValue *jsv, JsObject *jso); |
432 | static Datum populate_composite(CompositeIOData *io, Oid typid, |
433 | const char *colname, MemoryContext mcxt, |
434 | HeapTupleHeader defaultval, JsValue *jsv, bool isnull); |
435 | static Datum populate_scalar(ScalarIOData *io, Oid typid, int32 typmod, JsValue *jsv); |
436 | static void prepare_column_cache(ColumnIOData *column, Oid typid, int32 typmod, |
437 | MemoryContext mcxt, bool need_scalar); |
438 | static Datum populate_record_field(ColumnIOData *col, Oid typid, int32 typmod, |
439 | const char *colname, MemoryContext mcxt, Datum defaultval, |
440 | JsValue *jsv, bool *isnull); |
441 | static RecordIOData *allocate_record_info(MemoryContext mcxt, int ncolumns); |
442 | static bool JsObjectGetField(JsObject *obj, char *field, JsValue *jsv); |
443 | static void populate_recordset_record(PopulateRecordsetState *state, JsObject *obj); |
444 | static void populate_array_json(PopulateArrayContext *ctx, char *json, int len); |
445 | static void populate_array_dim_jsonb(PopulateArrayContext *ctx, JsonbValue *jbv, |
446 | int ndim); |
447 | static void populate_array_report_expected_array(PopulateArrayContext *ctx, int ndim); |
448 | static void populate_array_assign_ndims(PopulateArrayContext *ctx, int ndims); |
449 | static void populate_array_check_dimension(PopulateArrayContext *ctx, int ndim); |
450 | static void populate_array_element(PopulateArrayContext *ctx, int ndim, JsValue *jsv); |
451 | static Datum populate_array(ArrayIOData *aio, const char *colname, |
452 | MemoryContext mcxt, JsValue *jsv); |
453 | static Datum populate_domain(DomainIOData *io, Oid typid, const char *colname, |
454 | MemoryContext mcxt, JsValue *jsv, bool isnull); |
455 | |
456 | /* Worker that takes care of common setup for us */ |
457 | static JsonbValue *findJsonbValueFromContainerLen(JsonbContainer *container, |
458 | uint32 flags, |
459 | char *key, |
460 | uint32 keylen); |
461 | |
462 | /* functions supporting jsonb_delete, jsonb_set and jsonb_concat */ |
463 | static JsonbValue *IteratorConcat(JsonbIterator **it1, JsonbIterator **it2, |
464 | JsonbParseState **state); |
465 | static JsonbValue *setPath(JsonbIterator **it, Datum *path_elems, |
466 | bool *path_nulls, int path_len, |
467 | JsonbParseState **st, int level, Jsonb *newval, |
468 | int op_type); |
469 | static void setPathObject(JsonbIterator **it, Datum *path_elems, |
470 | bool *path_nulls, int path_len, JsonbParseState **st, |
471 | int level, |
472 | Jsonb *newval, uint32 npairs, int op_type); |
473 | static void setPathArray(JsonbIterator **it, Datum *path_elems, |
474 | bool *path_nulls, int path_len, JsonbParseState **st, |
475 | int level, Jsonb *newval, uint32 nelems, int op_type); |
476 | static void addJsonbToParseState(JsonbParseState **jbps, Jsonb *jb); |
477 | |
478 | /* function supporting iterate_json_values */ |
479 | static void iterate_values_scalar(void *state, char *token, JsonTokenType tokentype); |
480 | static void iterate_values_object_field_start(void *state, char *fname, bool isnull); |
481 | |
482 | /* functions supporting transform_json_string_values */ |
483 | static void transform_string_values_object_start(void *state); |
484 | static void transform_string_values_object_end(void *state); |
485 | static void transform_string_values_array_start(void *state); |
486 | static void transform_string_values_array_end(void *state); |
487 | static void transform_string_values_object_field_start(void *state, char *fname, bool isnull); |
488 | static void transform_string_values_array_element_start(void *state, bool isnull); |
489 | static void transform_string_values_scalar(void *state, char *token, JsonTokenType tokentype); |
490 | |
491 | /* |
492 | * SQL function json_object_keys |
493 | * |
494 | * Returns the set of keys for the object argument. |
495 | * |
496 | * This SRF operates in value-per-call mode. It processes the |
497 | * object during the first call, and the keys are simply stashed |
498 | * in an array, whose size is expanded as necessary. This is probably |
499 | * safe enough for a list of keys of a single object, since they are |
500 | * limited in size to NAMEDATALEN and the number of keys is unlikely to |
501 | * be so huge that it has major memory implications. |
502 | */ |
503 | Datum |
504 | jsonb_object_keys(PG_FUNCTION_ARGS) |
505 | { |
506 | FuncCallContext *funcctx; |
507 | OkeysState *state; |
508 | int i; |
509 | |
510 | if (SRF_IS_FIRSTCALL()) |
511 | { |
512 | MemoryContext oldcontext; |
513 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
514 | bool skipNested = false; |
515 | JsonbIterator *it; |
516 | JsonbValue v; |
517 | JsonbIteratorToken r; |
518 | |
519 | if (JB_ROOT_IS_SCALAR(jb)) |
520 | ereport(ERROR, |
521 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
522 | errmsg("cannot call %s on a scalar" , |
523 | "jsonb_object_keys" ))); |
524 | else if (JB_ROOT_IS_ARRAY(jb)) |
525 | ereport(ERROR, |
526 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
527 | errmsg("cannot call %s on an array" , |
528 | "jsonb_object_keys" ))); |
529 | |
530 | funcctx = SRF_FIRSTCALL_INIT(); |
531 | oldcontext = MemoryContextSwitchTo(funcctx->multi_call_memory_ctx); |
532 | |
533 | state = palloc(sizeof(OkeysState)); |
534 | |
535 | state->result_size = JB_ROOT_COUNT(jb); |
536 | state->result_count = 0; |
537 | state->sent_count = 0; |
538 | state->result = palloc(state->result_size * sizeof(char *)); |
539 | |
540 | it = JsonbIteratorInit(&jb->root); |
541 | |
542 | while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE) |
543 | { |
544 | skipNested = true; |
545 | |
546 | if (r == WJB_KEY) |
547 | { |
548 | char *cstr; |
549 | |
550 | cstr = palloc(v.val.string.len + 1 * sizeof(char)); |
551 | memcpy(cstr, v.val.string.val, v.val.string.len); |
552 | cstr[v.val.string.len] = '\0'; |
553 | state->result[state->result_count++] = cstr; |
554 | } |
555 | } |
556 | |
557 | MemoryContextSwitchTo(oldcontext); |
558 | funcctx->user_fctx = (void *) state; |
559 | } |
560 | |
561 | funcctx = SRF_PERCALL_SETUP(); |
562 | state = (OkeysState *) funcctx->user_fctx; |
563 | |
564 | if (state->sent_count < state->result_count) |
565 | { |
566 | char *nxt = state->result[state->sent_count++]; |
567 | |
568 | SRF_RETURN_NEXT(funcctx, CStringGetTextDatum(nxt)); |
569 | } |
570 | |
571 | /* cleanup to reduce or eliminate memory leaks */ |
572 | for (i = 0; i < state->result_count; i++) |
573 | pfree(state->result[i]); |
574 | pfree(state->result); |
575 | pfree(state); |
576 | |
577 | SRF_RETURN_DONE(funcctx); |
578 | } |
579 | |
580 | |
581 | Datum |
582 | json_object_keys(PG_FUNCTION_ARGS) |
583 | { |
584 | FuncCallContext *funcctx; |
585 | OkeysState *state; |
586 | int i; |
587 | |
588 | if (SRF_IS_FIRSTCALL()) |
589 | { |
590 | text *json = PG_GETARG_TEXT_PP(0); |
591 | JsonLexContext *lex = makeJsonLexContext(json, true); |
592 | JsonSemAction *sem; |
593 | MemoryContext oldcontext; |
594 | |
595 | funcctx = SRF_FIRSTCALL_INIT(); |
596 | oldcontext = MemoryContextSwitchTo(funcctx->multi_call_memory_ctx); |
597 | |
598 | state = palloc(sizeof(OkeysState)); |
599 | sem = palloc0(sizeof(JsonSemAction)); |
600 | |
601 | state->lex = lex; |
602 | state->result_size = 256; |
603 | state->result_count = 0; |
604 | state->sent_count = 0; |
605 | state->result = palloc(256 * sizeof(char *)); |
606 | |
607 | sem->semstate = (void *) state; |
608 | sem->array_start = okeys_array_start; |
609 | sem->scalar = okeys_scalar; |
610 | sem->object_field_start = okeys_object_field_start; |
611 | /* remainder are all NULL, courtesy of palloc0 above */ |
612 | |
613 | pg_parse_json(lex, sem); |
614 | /* keys are now in state->result */ |
615 | |
616 | pfree(lex->strval->data); |
617 | pfree(lex->strval); |
618 | pfree(lex); |
619 | pfree(sem); |
620 | |
621 | MemoryContextSwitchTo(oldcontext); |
622 | funcctx->user_fctx = (void *) state; |
623 | } |
624 | |
625 | funcctx = SRF_PERCALL_SETUP(); |
626 | state = (OkeysState *) funcctx->user_fctx; |
627 | |
628 | if (state->sent_count < state->result_count) |
629 | { |
630 | char *nxt = state->result[state->sent_count++]; |
631 | |
632 | SRF_RETURN_NEXT(funcctx, CStringGetTextDatum(nxt)); |
633 | } |
634 | |
635 | /* cleanup to reduce or eliminate memory leaks */ |
636 | for (i = 0; i < state->result_count; i++) |
637 | pfree(state->result[i]); |
638 | pfree(state->result); |
639 | pfree(state); |
640 | |
641 | SRF_RETURN_DONE(funcctx); |
642 | } |
643 | |
644 | static void |
645 | okeys_object_field_start(void *state, char *fname, bool isnull) |
646 | { |
647 | OkeysState *_state = (OkeysState *) state; |
648 | |
649 | /* only collecting keys for the top level object */ |
650 | if (_state->lex->lex_level != 1) |
651 | return; |
652 | |
653 | /* enlarge result array if necessary */ |
654 | if (_state->result_count >= _state->result_size) |
655 | { |
656 | _state->result_size *= 2; |
657 | _state->result = (char **) |
658 | repalloc(_state->result, sizeof(char *) * _state->result_size); |
659 | } |
660 | |
661 | /* save a copy of the field name */ |
662 | _state->result[_state->result_count++] = pstrdup(fname); |
663 | } |
664 | |
665 | static void |
666 | okeys_array_start(void *state) |
667 | { |
668 | OkeysState *_state = (OkeysState *) state; |
669 | |
670 | /* top level must be a json object */ |
671 | if (_state->lex->lex_level == 0) |
672 | ereport(ERROR, |
673 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
674 | errmsg("cannot call %s on an array" , |
675 | "json_object_keys" ))); |
676 | } |
677 | |
678 | static void |
679 | okeys_scalar(void *state, char *token, JsonTokenType tokentype) |
680 | { |
681 | OkeysState *_state = (OkeysState *) state; |
682 | |
683 | /* top level must be a json object */ |
684 | if (_state->lex->lex_level == 0) |
685 | ereport(ERROR, |
686 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
687 | errmsg("cannot call %s on a scalar" , |
688 | "json_object_keys" ))); |
689 | } |
690 | |
691 | /* |
692 | * json and jsonb getter functions |
693 | * these implement the -> ->> #> and #>> operators |
694 | * and the json{b?}_extract_path*(json, text, ...) functions |
695 | */ |
696 | |
697 | |
698 | Datum |
699 | json_object_field(PG_FUNCTION_ARGS) |
700 | { |
701 | text *json = PG_GETARG_TEXT_PP(0); |
702 | text *fname = PG_GETARG_TEXT_PP(1); |
703 | char *fnamestr = text_to_cstring(fname); |
704 | text *result; |
705 | |
706 | result = get_worker(json, &fnamestr, NULL, 1, false); |
707 | |
708 | if (result != NULL) |
709 | PG_RETURN_TEXT_P(result); |
710 | else |
711 | PG_RETURN_NULL(); |
712 | } |
713 | |
714 | Datum |
715 | jsonb_object_field(PG_FUNCTION_ARGS) |
716 | { |
717 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
718 | text *key = PG_GETARG_TEXT_PP(1); |
719 | JsonbValue *v; |
720 | |
721 | if (!JB_ROOT_IS_OBJECT(jb)) |
722 | PG_RETURN_NULL(); |
723 | |
724 | v = findJsonbValueFromContainerLen(&jb->root, JB_FOBJECT, |
725 | VARDATA_ANY(key), |
726 | VARSIZE_ANY_EXHDR(key)); |
727 | |
728 | if (v != NULL) |
729 | PG_RETURN_JSONB_P(JsonbValueToJsonb(v)); |
730 | |
731 | PG_RETURN_NULL(); |
732 | } |
733 | |
734 | Datum |
735 | json_object_field_text(PG_FUNCTION_ARGS) |
736 | { |
737 | text *json = PG_GETARG_TEXT_PP(0); |
738 | text *fname = PG_GETARG_TEXT_PP(1); |
739 | char *fnamestr = text_to_cstring(fname); |
740 | text *result; |
741 | |
742 | result = get_worker(json, &fnamestr, NULL, 1, true); |
743 | |
744 | if (result != NULL) |
745 | PG_RETURN_TEXT_P(result); |
746 | else |
747 | PG_RETURN_NULL(); |
748 | } |
749 | |
750 | Datum |
751 | jsonb_object_field_text(PG_FUNCTION_ARGS) |
752 | { |
753 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
754 | text *key = PG_GETARG_TEXT_PP(1); |
755 | JsonbValue *v; |
756 | |
757 | if (!JB_ROOT_IS_OBJECT(jb)) |
758 | PG_RETURN_NULL(); |
759 | |
760 | v = findJsonbValueFromContainerLen(&jb->root, JB_FOBJECT, |
761 | VARDATA_ANY(key), |
762 | VARSIZE_ANY_EXHDR(key)); |
763 | |
764 | if (v != NULL) |
765 | { |
766 | text *result = NULL; |
767 | |
768 | switch (v->type) |
769 | { |
770 | case jbvNull: |
771 | break; |
772 | case jbvBool: |
773 | result = cstring_to_text(v->val.boolean ? "true" : "false" ); |
774 | break; |
775 | case jbvString: |
776 | result = cstring_to_text_with_len(v->val.string.val, v->val.string.len); |
777 | break; |
778 | case jbvNumeric: |
779 | result = cstring_to_text(DatumGetCString(DirectFunctionCall1(numeric_out, |
780 | PointerGetDatum(v->val.numeric)))); |
781 | break; |
782 | case jbvBinary: |
783 | { |
784 | StringInfo jtext = makeStringInfo(); |
785 | |
786 | (void) JsonbToCString(jtext, v->val.binary.data, -1); |
787 | result = cstring_to_text_with_len(jtext->data, jtext->len); |
788 | } |
789 | break; |
790 | default: |
791 | elog(ERROR, "unrecognized jsonb type: %d" , (int) v->type); |
792 | } |
793 | |
794 | if (result) |
795 | PG_RETURN_TEXT_P(result); |
796 | } |
797 | |
798 | PG_RETURN_NULL(); |
799 | } |
800 | |
801 | Datum |
802 | json_array_element(PG_FUNCTION_ARGS) |
803 | { |
804 | text *json = PG_GETARG_TEXT_PP(0); |
805 | int element = PG_GETARG_INT32(1); |
806 | text *result; |
807 | |
808 | result = get_worker(json, NULL, &element, 1, false); |
809 | |
810 | if (result != NULL) |
811 | PG_RETURN_TEXT_P(result); |
812 | else |
813 | PG_RETURN_NULL(); |
814 | } |
815 | |
816 | Datum |
817 | jsonb_array_element(PG_FUNCTION_ARGS) |
818 | { |
819 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
820 | int element = PG_GETARG_INT32(1); |
821 | JsonbValue *v; |
822 | |
823 | if (!JB_ROOT_IS_ARRAY(jb)) |
824 | PG_RETURN_NULL(); |
825 | |
826 | /* Handle negative subscript */ |
827 | if (element < 0) |
828 | { |
829 | uint32 nelements = JB_ROOT_COUNT(jb); |
830 | |
831 | if (-element > nelements) |
832 | PG_RETURN_NULL(); |
833 | else |
834 | element += nelements; |
835 | } |
836 | |
837 | v = getIthJsonbValueFromContainer(&jb->root, element); |
838 | if (v != NULL) |
839 | PG_RETURN_JSONB_P(JsonbValueToJsonb(v)); |
840 | |
841 | PG_RETURN_NULL(); |
842 | } |
843 | |
844 | Datum |
845 | json_array_element_text(PG_FUNCTION_ARGS) |
846 | { |
847 | text *json = PG_GETARG_TEXT_PP(0); |
848 | int element = PG_GETARG_INT32(1); |
849 | text *result; |
850 | |
851 | result = get_worker(json, NULL, &element, 1, true); |
852 | |
853 | if (result != NULL) |
854 | PG_RETURN_TEXT_P(result); |
855 | else |
856 | PG_RETURN_NULL(); |
857 | } |
858 | |
859 | Datum |
860 | jsonb_array_element_text(PG_FUNCTION_ARGS) |
861 | { |
862 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
863 | int element = PG_GETARG_INT32(1); |
864 | JsonbValue *v; |
865 | |
866 | if (!JB_ROOT_IS_ARRAY(jb)) |
867 | PG_RETURN_NULL(); |
868 | |
869 | /* Handle negative subscript */ |
870 | if (element < 0) |
871 | { |
872 | uint32 nelements = JB_ROOT_COUNT(jb); |
873 | |
874 | if (-element > nelements) |
875 | PG_RETURN_NULL(); |
876 | else |
877 | element += nelements; |
878 | } |
879 | |
880 | v = getIthJsonbValueFromContainer(&jb->root, element); |
881 | if (v != NULL) |
882 | { |
883 | text *result = NULL; |
884 | |
885 | switch (v->type) |
886 | { |
887 | case jbvNull: |
888 | break; |
889 | case jbvBool: |
890 | result = cstring_to_text(v->val.boolean ? "true" : "false" ); |
891 | break; |
892 | case jbvString: |
893 | result = cstring_to_text_with_len(v->val.string.val, v->val.string.len); |
894 | break; |
895 | case jbvNumeric: |
896 | result = cstring_to_text(DatumGetCString(DirectFunctionCall1(numeric_out, |
897 | PointerGetDatum(v->val.numeric)))); |
898 | break; |
899 | case jbvBinary: |
900 | { |
901 | StringInfo jtext = makeStringInfo(); |
902 | |
903 | (void) JsonbToCString(jtext, v->val.binary.data, -1); |
904 | result = cstring_to_text_with_len(jtext->data, jtext->len); |
905 | } |
906 | break; |
907 | default: |
908 | elog(ERROR, "unrecognized jsonb type: %d" , (int) v->type); |
909 | } |
910 | |
911 | if (result) |
912 | PG_RETURN_TEXT_P(result); |
913 | } |
914 | |
915 | PG_RETURN_NULL(); |
916 | } |
917 | |
918 | Datum |
919 | (PG_FUNCTION_ARGS) |
920 | { |
921 | return get_path_all(fcinfo, false); |
922 | } |
923 | |
924 | Datum |
925 | (PG_FUNCTION_ARGS) |
926 | { |
927 | return get_path_all(fcinfo, true); |
928 | } |
929 | |
930 | /* |
931 | * common routine for extract_path functions |
932 | */ |
933 | static Datum |
934 | get_path_all(FunctionCallInfo fcinfo, bool as_text) |
935 | { |
936 | text *json = PG_GETARG_TEXT_PP(0); |
937 | ArrayType *path = PG_GETARG_ARRAYTYPE_P(1); |
938 | text *result; |
939 | Datum *pathtext; |
940 | bool *pathnulls; |
941 | int npath; |
942 | char **tpath; |
943 | int *ipath; |
944 | int i; |
945 | |
946 | /* |
947 | * If the array contains any null elements, return NULL, on the grounds |
948 | * that you'd have gotten NULL if any RHS value were NULL in a nested |
949 | * series of applications of the -> operator. (Note: because we also |
950 | * return NULL for error cases such as no-such-field, this is true |
951 | * regardless of the contents of the rest of the array.) |
952 | */ |
953 | if (array_contains_nulls(path)) |
954 | PG_RETURN_NULL(); |
955 | |
956 | deconstruct_array(path, TEXTOID, -1, false, 'i', |
957 | &pathtext, &pathnulls, &npath); |
958 | |
959 | tpath = palloc(npath * sizeof(char *)); |
960 | ipath = palloc(npath * sizeof(int)); |
961 | |
962 | for (i = 0; i < npath; i++) |
963 | { |
964 | Assert(!pathnulls[i]); |
965 | tpath[i] = TextDatumGetCString(pathtext[i]); |
966 | |
967 | /* |
968 | * we have no idea at this stage what structure the document is so |
969 | * just convert anything in the path that we can to an integer and set |
970 | * all the other integers to INT_MIN which will never match. |
971 | */ |
972 | if (*tpath[i] != '\0') |
973 | { |
974 | long ind; |
975 | char *endptr; |
976 | |
977 | errno = 0; |
978 | ind = strtol(tpath[i], &endptr, 10); |
979 | if (*endptr == '\0' && errno == 0 && ind <= INT_MAX && ind >= INT_MIN) |
980 | ipath[i] = (int) ind; |
981 | else |
982 | ipath[i] = INT_MIN; |
983 | } |
984 | else |
985 | ipath[i] = INT_MIN; |
986 | } |
987 | |
988 | result = get_worker(json, tpath, ipath, npath, as_text); |
989 | |
990 | if (result != NULL) |
991 | PG_RETURN_TEXT_P(result); |
992 | else |
993 | PG_RETURN_NULL(); |
994 | } |
995 | |
996 | /* |
997 | * get_worker |
998 | * |
999 | * common worker for all the json getter functions |
1000 | * |
1001 | * json: JSON object (in text form) |
1002 | * tpath[]: field name(s) to extract |
1003 | * ipath[]: array index(es) (zero-based) to extract, accepts negatives |
1004 | * npath: length of tpath[] and/or ipath[] |
1005 | * normalize_results: true to de-escape string and null scalars |
1006 | * |
1007 | * tpath can be NULL, or any one tpath[] entry can be NULL, if an object |
1008 | * field is not to be matched at that nesting level. Similarly, ipath can |
1009 | * be NULL, or any one ipath[] entry can be INT_MIN if an array element is |
1010 | * not to be matched at that nesting level (a json datum should never be |
1011 | * large enough to have -INT_MIN elements due to MaxAllocSize restriction). |
1012 | */ |
1013 | static text * |
1014 | get_worker(text *json, |
1015 | char **tpath, |
1016 | int *ipath, |
1017 | int npath, |
1018 | bool normalize_results) |
1019 | { |
1020 | JsonLexContext *lex = makeJsonLexContext(json, true); |
1021 | JsonSemAction *sem = palloc0(sizeof(JsonSemAction)); |
1022 | GetState *state = palloc0(sizeof(GetState)); |
1023 | |
1024 | Assert(npath >= 0); |
1025 | |
1026 | state->lex = lex; |
1027 | /* is it "_as_text" variant? */ |
1028 | state->normalize_results = normalize_results; |
1029 | state->npath = npath; |
1030 | state->path_names = tpath; |
1031 | state->path_indexes = ipath; |
1032 | state->pathok = palloc0(sizeof(bool) * npath); |
1033 | state->array_cur_index = palloc(sizeof(int) * npath); |
1034 | |
1035 | if (npath > 0) |
1036 | state->pathok[0] = true; |
1037 | |
1038 | sem->semstate = (void *) state; |
1039 | |
1040 | /* |
1041 | * Not all variants need all the semantic routines. Only set the ones that |
1042 | * are actually needed for maximum efficiency. |
1043 | */ |
1044 | sem->scalar = get_scalar; |
1045 | if (npath == 0) |
1046 | { |
1047 | sem->object_start = get_object_start; |
1048 | sem->object_end = get_object_end; |
1049 | sem->array_start = get_array_start; |
1050 | sem->array_end = get_array_end; |
1051 | } |
1052 | if (tpath != NULL) |
1053 | { |
1054 | sem->object_field_start = get_object_field_start; |
1055 | sem->object_field_end = get_object_field_end; |
1056 | } |
1057 | if (ipath != NULL) |
1058 | { |
1059 | sem->array_start = get_array_start; |
1060 | sem->array_element_start = get_array_element_start; |
1061 | sem->array_element_end = get_array_element_end; |
1062 | } |
1063 | |
1064 | pg_parse_json(lex, sem); |
1065 | |
1066 | return state->tresult; |
1067 | } |
1068 | |
1069 | static void |
1070 | get_object_start(void *state) |
1071 | { |
1072 | GetState *_state = (GetState *) state; |
1073 | int lex_level = _state->lex->lex_level; |
1074 | |
1075 | if (lex_level == 0 && _state->npath == 0) |
1076 | { |
1077 | /* |
1078 | * Special case: we should match the entire object. We only need this |
1079 | * at outermost level because at nested levels the match will have |
1080 | * been started by the outer field or array element callback. |
1081 | */ |
1082 | _state->result_start = _state->lex->token_start; |
1083 | } |
1084 | } |
1085 | |
1086 | static void |
1087 | get_object_end(void *state) |
1088 | { |
1089 | GetState *_state = (GetState *) state; |
1090 | int lex_level = _state->lex->lex_level; |
1091 | |
1092 | if (lex_level == 0 && _state->npath == 0) |
1093 | { |
1094 | /* Special case: return the entire object */ |
1095 | char *start = _state->result_start; |
1096 | int len = _state->lex->prev_token_terminator - start; |
1097 | |
1098 | _state->tresult = cstring_to_text_with_len(start, len); |
1099 | } |
1100 | } |
1101 | |
1102 | static void |
1103 | get_object_field_start(void *state, char *fname, bool isnull) |
1104 | { |
1105 | GetState *_state = (GetState *) state; |
1106 | bool get_next = false; |
1107 | int lex_level = _state->lex->lex_level; |
1108 | |
1109 | if (lex_level <= _state->npath && |
1110 | _state->pathok[lex_level - 1] && |
1111 | _state->path_names != NULL && |
1112 | _state->path_names[lex_level - 1] != NULL && |
1113 | strcmp(fname, _state->path_names[lex_level - 1]) == 0) |
1114 | { |
1115 | if (lex_level < _state->npath) |
1116 | { |
1117 | /* if not at end of path just mark path ok */ |
1118 | _state->pathok[lex_level] = true; |
1119 | } |
1120 | else |
1121 | { |
1122 | /* end of path, so we want this value */ |
1123 | get_next = true; |
1124 | } |
1125 | } |
1126 | |
1127 | if (get_next) |
1128 | { |
1129 | /* this object overrides any previous matching object */ |
1130 | _state->tresult = NULL; |
1131 | _state->result_start = NULL; |
1132 | |
1133 | if (_state->normalize_results && |
1134 | _state->lex->token_type == JSON_TOKEN_STRING) |
1135 | { |
1136 | /* for as_text variants, tell get_scalar to set it for us */ |
1137 | _state->next_scalar = true; |
1138 | } |
1139 | else |
1140 | { |
1141 | /* for non-as_text variants, just note the json starting point */ |
1142 | _state->result_start = _state->lex->token_start; |
1143 | } |
1144 | } |
1145 | } |
1146 | |
1147 | static void |
1148 | get_object_field_end(void *state, char *fname, bool isnull) |
1149 | { |
1150 | GetState *_state = (GetState *) state; |
1151 | bool get_last = false; |
1152 | int lex_level = _state->lex->lex_level; |
1153 | |
1154 | /* same tests as in get_object_field_start */ |
1155 | if (lex_level <= _state->npath && |
1156 | _state->pathok[lex_level - 1] && |
1157 | _state->path_names != NULL && |
1158 | _state->path_names[lex_level - 1] != NULL && |
1159 | strcmp(fname, _state->path_names[lex_level - 1]) == 0) |
1160 | { |
1161 | if (lex_level < _state->npath) |
1162 | { |
1163 | /* done with this field so reset pathok */ |
1164 | _state->pathok[lex_level] = false; |
1165 | } |
1166 | else |
1167 | { |
1168 | /* end of path, so we want this value */ |
1169 | get_last = true; |
1170 | } |
1171 | } |
1172 | |
1173 | /* for as_text scalar case, our work is already done */ |
1174 | if (get_last && _state->result_start != NULL) |
1175 | { |
1176 | /* |
1177 | * make a text object from the string from the previously noted json |
1178 | * start up to the end of the previous token (the lexer is by now |
1179 | * ahead of us on whatever came after what we're interested in). |
1180 | */ |
1181 | if (isnull && _state->normalize_results) |
1182 | _state->tresult = (text *) NULL; |
1183 | else |
1184 | { |
1185 | char *start = _state->result_start; |
1186 | int len = _state->lex->prev_token_terminator - start; |
1187 | |
1188 | _state->tresult = cstring_to_text_with_len(start, len); |
1189 | } |
1190 | |
1191 | /* this should be unnecessary but let's do it for cleanliness: */ |
1192 | _state->result_start = NULL; |
1193 | } |
1194 | } |
1195 | |
1196 | static void |
1197 | get_array_start(void *state) |
1198 | { |
1199 | GetState *_state = (GetState *) state; |
1200 | int lex_level = _state->lex->lex_level; |
1201 | |
1202 | if (lex_level < _state->npath) |
1203 | { |
1204 | /* Initialize counting of elements in this array */ |
1205 | _state->array_cur_index[lex_level] = -1; |
1206 | |
1207 | /* INT_MIN value is reserved to represent invalid subscript */ |
1208 | if (_state->path_indexes[lex_level] < 0 && |
1209 | _state->path_indexes[lex_level] != INT_MIN) |
1210 | { |
1211 | /* Negative subscript -- convert to positive-wise subscript */ |
1212 | int nelements = json_count_array_elements(_state->lex); |
1213 | |
1214 | if (-_state->path_indexes[lex_level] <= nelements) |
1215 | _state->path_indexes[lex_level] += nelements; |
1216 | } |
1217 | } |
1218 | else if (lex_level == 0 && _state->npath == 0) |
1219 | { |
1220 | /* |
1221 | * Special case: we should match the entire array. We only need this |
1222 | * at the outermost level because at nested levels the match will have |
1223 | * been started by the outer field or array element callback. |
1224 | */ |
1225 | _state->result_start = _state->lex->token_start; |
1226 | } |
1227 | } |
1228 | |
1229 | static void |
1230 | get_array_end(void *state) |
1231 | { |
1232 | GetState *_state = (GetState *) state; |
1233 | int lex_level = _state->lex->lex_level; |
1234 | |
1235 | if (lex_level == 0 && _state->npath == 0) |
1236 | { |
1237 | /* Special case: return the entire array */ |
1238 | char *start = _state->result_start; |
1239 | int len = _state->lex->prev_token_terminator - start; |
1240 | |
1241 | _state->tresult = cstring_to_text_with_len(start, len); |
1242 | } |
1243 | } |
1244 | |
1245 | static void |
1246 | get_array_element_start(void *state, bool isnull) |
1247 | { |
1248 | GetState *_state = (GetState *) state; |
1249 | bool get_next = false; |
1250 | int lex_level = _state->lex->lex_level; |
1251 | |
1252 | /* Update array element counter */ |
1253 | if (lex_level <= _state->npath) |
1254 | _state->array_cur_index[lex_level - 1]++; |
1255 | |
1256 | if (lex_level <= _state->npath && |
1257 | _state->pathok[lex_level - 1] && |
1258 | _state->path_indexes != NULL && |
1259 | _state->array_cur_index[lex_level - 1] == _state->path_indexes[lex_level - 1]) |
1260 | { |
1261 | if (lex_level < _state->npath) |
1262 | { |
1263 | /* if not at end of path just mark path ok */ |
1264 | _state->pathok[lex_level] = true; |
1265 | } |
1266 | else |
1267 | { |
1268 | /* end of path, so we want this value */ |
1269 | get_next = true; |
1270 | } |
1271 | } |
1272 | |
1273 | /* same logic as for objects */ |
1274 | if (get_next) |
1275 | { |
1276 | _state->tresult = NULL; |
1277 | _state->result_start = NULL; |
1278 | |
1279 | if (_state->normalize_results && |
1280 | _state->lex->token_type == JSON_TOKEN_STRING) |
1281 | { |
1282 | _state->next_scalar = true; |
1283 | } |
1284 | else |
1285 | { |
1286 | _state->result_start = _state->lex->token_start; |
1287 | } |
1288 | } |
1289 | } |
1290 | |
1291 | static void |
1292 | get_array_element_end(void *state, bool isnull) |
1293 | { |
1294 | GetState *_state = (GetState *) state; |
1295 | bool get_last = false; |
1296 | int lex_level = _state->lex->lex_level; |
1297 | |
1298 | /* same tests as in get_array_element_start */ |
1299 | if (lex_level <= _state->npath && |
1300 | _state->pathok[lex_level - 1] && |
1301 | _state->path_indexes != NULL && |
1302 | _state->array_cur_index[lex_level - 1] == _state->path_indexes[lex_level - 1]) |
1303 | { |
1304 | if (lex_level < _state->npath) |
1305 | { |
1306 | /* done with this element so reset pathok */ |
1307 | _state->pathok[lex_level] = false; |
1308 | } |
1309 | else |
1310 | { |
1311 | /* end of path, so we want this value */ |
1312 | get_last = true; |
1313 | } |
1314 | } |
1315 | |
1316 | /* same logic as for objects */ |
1317 | if (get_last && _state->result_start != NULL) |
1318 | { |
1319 | if (isnull && _state->normalize_results) |
1320 | _state->tresult = (text *) NULL; |
1321 | else |
1322 | { |
1323 | char *start = _state->result_start; |
1324 | int len = _state->lex->prev_token_terminator - start; |
1325 | |
1326 | _state->tresult = cstring_to_text_with_len(start, len); |
1327 | } |
1328 | |
1329 | _state->result_start = NULL; |
1330 | } |
1331 | } |
1332 | |
1333 | static void |
1334 | get_scalar(void *state, char *token, JsonTokenType tokentype) |
1335 | { |
1336 | GetState *_state = (GetState *) state; |
1337 | int lex_level = _state->lex->lex_level; |
1338 | |
1339 | /* Check for whole-object match */ |
1340 | if (lex_level == 0 && _state->npath == 0) |
1341 | { |
1342 | if (_state->normalize_results && tokentype == JSON_TOKEN_STRING) |
1343 | { |
1344 | /* we want the de-escaped string */ |
1345 | _state->next_scalar = true; |
1346 | } |
1347 | else if (_state->normalize_results && tokentype == JSON_TOKEN_NULL) |
1348 | { |
1349 | _state->tresult = (text *) NULL; |
1350 | } |
1351 | else |
1352 | { |
1353 | /* |
1354 | * This is a bit hokey: we will suppress whitespace after the |
1355 | * scalar token, but not whitespace before it. Probably not worth |
1356 | * doing our own space-skipping to avoid that. |
1357 | */ |
1358 | char *start = _state->lex->input; |
1359 | int len = _state->lex->prev_token_terminator - start; |
1360 | |
1361 | _state->tresult = cstring_to_text_with_len(start, len); |
1362 | } |
1363 | } |
1364 | |
1365 | if (_state->next_scalar) |
1366 | { |
1367 | /* a de-escaped text value is wanted, so supply it */ |
1368 | _state->tresult = cstring_to_text(token); |
1369 | /* make sure the next call to get_scalar doesn't overwrite it */ |
1370 | _state->next_scalar = false; |
1371 | } |
1372 | } |
1373 | |
1374 | Datum |
1375 | (PG_FUNCTION_ARGS) |
1376 | { |
1377 | return get_jsonb_path_all(fcinfo, false); |
1378 | } |
1379 | |
1380 | Datum |
1381 | (PG_FUNCTION_ARGS) |
1382 | { |
1383 | return get_jsonb_path_all(fcinfo, true); |
1384 | } |
1385 | |
1386 | static Datum |
1387 | get_jsonb_path_all(FunctionCallInfo fcinfo, bool as_text) |
1388 | { |
1389 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
1390 | ArrayType *path = PG_GETARG_ARRAYTYPE_P(1); |
1391 | Jsonb *res; |
1392 | Datum *pathtext; |
1393 | bool *pathnulls; |
1394 | int npath; |
1395 | int i; |
1396 | bool have_object = false, |
1397 | have_array = false; |
1398 | JsonbValue *jbvp = NULL; |
1399 | JsonbValue tv; |
1400 | JsonbContainer *container; |
1401 | |
1402 | /* |
1403 | * If the array contains any null elements, return NULL, on the grounds |
1404 | * that you'd have gotten NULL if any RHS value were NULL in a nested |
1405 | * series of applications of the -> operator. (Note: because we also |
1406 | * return NULL for error cases such as no-such-field, this is true |
1407 | * regardless of the contents of the rest of the array.) |
1408 | */ |
1409 | if (array_contains_nulls(path)) |
1410 | PG_RETURN_NULL(); |
1411 | |
1412 | deconstruct_array(path, TEXTOID, -1, false, 'i', |
1413 | &pathtext, &pathnulls, &npath); |
1414 | |
1415 | /* Identify whether we have object, array, or scalar at top-level */ |
1416 | container = &jb->root; |
1417 | |
1418 | if (JB_ROOT_IS_OBJECT(jb)) |
1419 | have_object = true; |
1420 | else if (JB_ROOT_IS_ARRAY(jb) && !JB_ROOT_IS_SCALAR(jb)) |
1421 | have_array = true; |
1422 | else |
1423 | { |
1424 | Assert(JB_ROOT_IS_ARRAY(jb) && JB_ROOT_IS_SCALAR(jb)); |
1425 | /* Extract the scalar value, if it is what we'll return */ |
1426 | if (npath <= 0) |
1427 | jbvp = getIthJsonbValueFromContainer(container, 0); |
1428 | } |
1429 | |
1430 | /* |
1431 | * If the array is empty, return the entire LHS object, on the grounds |
1432 | * that we should do zero field or element extractions. For the |
1433 | * non-scalar case we can just hand back the object without much work. For |
1434 | * the scalar case, fall through and deal with the value below the loop. |
1435 | * (This inconsistency arises because there's no easy way to generate a |
1436 | * JsonbValue directly for root-level containers.) |
1437 | */ |
1438 | if (npath <= 0 && jbvp == NULL) |
1439 | { |
1440 | if (as_text) |
1441 | { |
1442 | PG_RETURN_TEXT_P(cstring_to_text(JsonbToCString(NULL, |
1443 | container, |
1444 | VARSIZE(jb)))); |
1445 | } |
1446 | else |
1447 | { |
1448 | /* not text mode - just hand back the jsonb */ |
1449 | PG_RETURN_JSONB_P(jb); |
1450 | } |
1451 | } |
1452 | |
1453 | for (i = 0; i < npath; i++) |
1454 | { |
1455 | if (have_object) |
1456 | { |
1457 | jbvp = findJsonbValueFromContainerLen(container, |
1458 | JB_FOBJECT, |
1459 | VARDATA(pathtext[i]), |
1460 | VARSIZE(pathtext[i]) - VARHDRSZ); |
1461 | } |
1462 | else if (have_array) |
1463 | { |
1464 | long lindex; |
1465 | uint32 index; |
1466 | char *indextext = TextDatumGetCString(pathtext[i]); |
1467 | char *endptr; |
1468 | |
1469 | errno = 0; |
1470 | lindex = strtol(indextext, &endptr, 10); |
1471 | if (endptr == indextext || *endptr != '\0' || errno != 0 || |
1472 | lindex > INT_MAX || lindex < INT_MIN) |
1473 | PG_RETURN_NULL(); |
1474 | |
1475 | if (lindex >= 0) |
1476 | { |
1477 | index = (uint32) lindex; |
1478 | } |
1479 | else |
1480 | { |
1481 | /* Handle negative subscript */ |
1482 | uint32 nelements; |
1483 | |
1484 | /* Container must be array, but make sure */ |
1485 | if (!JsonContainerIsArray(container)) |
1486 | elog(ERROR, "not a jsonb array" ); |
1487 | |
1488 | nelements = JsonContainerSize(container); |
1489 | |
1490 | if (-lindex > nelements) |
1491 | PG_RETURN_NULL(); |
1492 | else |
1493 | index = nelements + lindex; |
1494 | } |
1495 | |
1496 | jbvp = getIthJsonbValueFromContainer(container, index); |
1497 | } |
1498 | else |
1499 | { |
1500 | /* scalar, extraction yields a null */ |
1501 | PG_RETURN_NULL(); |
1502 | } |
1503 | |
1504 | if (jbvp == NULL) |
1505 | PG_RETURN_NULL(); |
1506 | else if (i == npath - 1) |
1507 | break; |
1508 | |
1509 | if (jbvp->type == jbvBinary) |
1510 | { |
1511 | JsonbIterator *it = JsonbIteratorInit((JsonbContainer *) jbvp->val.binary.data); |
1512 | JsonbIteratorToken r; |
1513 | |
1514 | r = JsonbIteratorNext(&it, &tv, true); |
1515 | container = (JsonbContainer *) jbvp->val.binary.data; |
1516 | have_object = r == WJB_BEGIN_OBJECT; |
1517 | have_array = r == WJB_BEGIN_ARRAY; |
1518 | } |
1519 | else |
1520 | { |
1521 | have_object = jbvp->type == jbvObject; |
1522 | have_array = jbvp->type == jbvArray; |
1523 | } |
1524 | } |
1525 | |
1526 | if (as_text) |
1527 | { |
1528 | /* special-case outputs for string and null values */ |
1529 | if (jbvp->type == jbvString) |
1530 | PG_RETURN_TEXT_P(cstring_to_text_with_len(jbvp->val.string.val, |
1531 | jbvp->val.string.len)); |
1532 | if (jbvp->type == jbvNull) |
1533 | PG_RETURN_NULL(); |
1534 | } |
1535 | |
1536 | res = JsonbValueToJsonb(jbvp); |
1537 | |
1538 | if (as_text) |
1539 | { |
1540 | PG_RETURN_TEXT_P(cstring_to_text(JsonbToCString(NULL, |
1541 | &res->root, |
1542 | VARSIZE(res)))); |
1543 | } |
1544 | else |
1545 | { |
1546 | /* not text mode - just hand back the jsonb */ |
1547 | PG_RETURN_JSONB_P(res); |
1548 | } |
1549 | } |
1550 | |
1551 | /* |
1552 | * SQL function json_array_length(json) -> int |
1553 | */ |
1554 | Datum |
1555 | json_array_length(PG_FUNCTION_ARGS) |
1556 | { |
1557 | text *json = PG_GETARG_TEXT_PP(0); |
1558 | AlenState *state; |
1559 | JsonLexContext *lex; |
1560 | JsonSemAction *sem; |
1561 | |
1562 | lex = makeJsonLexContext(json, false); |
1563 | state = palloc0(sizeof(AlenState)); |
1564 | sem = palloc0(sizeof(JsonSemAction)); |
1565 | |
1566 | /* palloc0 does this for us */ |
1567 | #if 0 |
1568 | state->count = 0; |
1569 | #endif |
1570 | state->lex = lex; |
1571 | |
1572 | sem->semstate = (void *) state; |
1573 | sem->object_start = alen_object_start; |
1574 | sem->scalar = alen_scalar; |
1575 | sem->array_element_start = alen_array_element_start; |
1576 | |
1577 | pg_parse_json(lex, sem); |
1578 | |
1579 | PG_RETURN_INT32(state->count); |
1580 | } |
1581 | |
1582 | Datum |
1583 | jsonb_array_length(PG_FUNCTION_ARGS) |
1584 | { |
1585 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
1586 | |
1587 | if (JB_ROOT_IS_SCALAR(jb)) |
1588 | ereport(ERROR, |
1589 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1590 | errmsg("cannot get array length of a scalar" ))); |
1591 | else if (!JB_ROOT_IS_ARRAY(jb)) |
1592 | ereport(ERROR, |
1593 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1594 | errmsg("cannot get array length of a non-array" ))); |
1595 | |
1596 | PG_RETURN_INT32(JB_ROOT_COUNT(jb)); |
1597 | } |
1598 | |
1599 | /* |
1600 | * These next two checks ensure that the json is an array (since it can't be |
1601 | * a scalar or an object). |
1602 | */ |
1603 | |
1604 | static void |
1605 | alen_object_start(void *state) |
1606 | { |
1607 | AlenState *_state = (AlenState *) state; |
1608 | |
1609 | /* json structure check */ |
1610 | if (_state->lex->lex_level == 0) |
1611 | ereport(ERROR, |
1612 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1613 | errmsg("cannot get array length of a non-array" ))); |
1614 | } |
1615 | |
1616 | static void |
1617 | alen_scalar(void *state, char *token, JsonTokenType tokentype) |
1618 | { |
1619 | AlenState *_state = (AlenState *) state; |
1620 | |
1621 | /* json structure check */ |
1622 | if (_state->lex->lex_level == 0) |
1623 | ereport(ERROR, |
1624 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1625 | errmsg("cannot get array length of a scalar" ))); |
1626 | } |
1627 | |
1628 | static void |
1629 | alen_array_element_start(void *state, bool isnull) |
1630 | { |
1631 | AlenState *_state = (AlenState *) state; |
1632 | |
1633 | /* just count up all the level 1 elements */ |
1634 | if (_state->lex->lex_level == 1) |
1635 | _state->count++; |
1636 | } |
1637 | |
1638 | /* |
1639 | * SQL function json_each and json_each_text |
1640 | * |
1641 | * decompose a json object into key value pairs. |
1642 | * |
1643 | * Unlike json_object_keys() these SRFs operate in materialize mode, |
1644 | * stashing results into a Tuplestore object as they go. |
1645 | * The construction of tuples is done using a temporary memory context |
1646 | * that is cleared out after each tuple is built. |
1647 | */ |
1648 | Datum |
1649 | json_each(PG_FUNCTION_ARGS) |
1650 | { |
1651 | return each_worker(fcinfo, false); |
1652 | } |
1653 | |
1654 | Datum |
1655 | jsonb_each(PG_FUNCTION_ARGS) |
1656 | { |
1657 | return each_worker_jsonb(fcinfo, "jsonb_each" , false); |
1658 | } |
1659 | |
1660 | Datum |
1661 | json_each_text(PG_FUNCTION_ARGS) |
1662 | { |
1663 | return each_worker(fcinfo, true); |
1664 | } |
1665 | |
1666 | Datum |
1667 | jsonb_each_text(PG_FUNCTION_ARGS) |
1668 | { |
1669 | return each_worker_jsonb(fcinfo, "jsonb_each_text" , true); |
1670 | } |
1671 | |
1672 | static Datum |
1673 | each_worker_jsonb(FunctionCallInfo fcinfo, const char *funcname, bool as_text) |
1674 | { |
1675 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
1676 | ReturnSetInfo *rsi; |
1677 | Tuplestorestate *tuple_store; |
1678 | TupleDesc tupdesc; |
1679 | TupleDesc ret_tdesc; |
1680 | MemoryContext old_cxt, |
1681 | tmp_cxt; |
1682 | bool skipNested = false; |
1683 | JsonbIterator *it; |
1684 | JsonbValue v; |
1685 | JsonbIteratorToken r; |
1686 | |
1687 | if (!JB_ROOT_IS_OBJECT(jb)) |
1688 | ereport(ERROR, |
1689 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1690 | errmsg("cannot call %s on a non-object" , |
1691 | funcname))); |
1692 | |
1693 | rsi = (ReturnSetInfo *) fcinfo->resultinfo; |
1694 | |
1695 | if (!rsi || !IsA(rsi, ReturnSetInfo) || |
1696 | (rsi->allowedModes & SFRM_Materialize) == 0 || |
1697 | rsi->expectedDesc == NULL) |
1698 | ereport(ERROR, |
1699 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
1700 | errmsg("set-valued function called in context that " |
1701 | "cannot accept a set" ))); |
1702 | |
1703 | rsi->returnMode = SFRM_Materialize; |
1704 | |
1705 | if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE) |
1706 | ereport(ERROR, |
1707 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
1708 | errmsg("function returning record called in context " |
1709 | "that cannot accept type record" ))); |
1710 | |
1711 | old_cxt = MemoryContextSwitchTo(rsi->econtext->ecxt_per_query_memory); |
1712 | |
1713 | ret_tdesc = CreateTupleDescCopy(tupdesc); |
1714 | BlessTupleDesc(ret_tdesc); |
1715 | tuple_store = |
1716 | tuplestore_begin_heap(rsi->allowedModes & SFRM_Materialize_Random, |
1717 | false, work_mem); |
1718 | |
1719 | MemoryContextSwitchTo(old_cxt); |
1720 | |
1721 | tmp_cxt = AllocSetContextCreate(CurrentMemoryContext, |
1722 | "jsonb_each temporary cxt" , |
1723 | ALLOCSET_DEFAULT_SIZES); |
1724 | |
1725 | it = JsonbIteratorInit(&jb->root); |
1726 | |
1727 | while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE) |
1728 | { |
1729 | skipNested = true; |
1730 | |
1731 | if (r == WJB_KEY) |
1732 | { |
1733 | text *key; |
1734 | HeapTuple tuple; |
1735 | Datum values[2]; |
1736 | bool nulls[2] = {false, false}; |
1737 | |
1738 | /* Use the tmp context so we can clean up after each tuple is done */ |
1739 | old_cxt = MemoryContextSwitchTo(tmp_cxt); |
1740 | |
1741 | key = cstring_to_text_with_len(v.val.string.val, v.val.string.len); |
1742 | |
1743 | /* |
1744 | * The next thing the iterator fetches should be the value, no |
1745 | * matter what shape it is. |
1746 | */ |
1747 | r = JsonbIteratorNext(&it, &v, skipNested); |
1748 | Assert(r != WJB_DONE); |
1749 | |
1750 | values[0] = PointerGetDatum(key); |
1751 | |
1752 | if (as_text) |
1753 | { |
1754 | if (v.type == jbvNull) |
1755 | { |
1756 | /* a json null is an sql null in text mode */ |
1757 | nulls[1] = true; |
1758 | values[1] = (Datum) NULL; |
1759 | } |
1760 | else |
1761 | { |
1762 | text *sv; |
1763 | |
1764 | if (v.type == jbvString) |
1765 | { |
1766 | /* In text mode, scalar strings should be dequoted */ |
1767 | sv = cstring_to_text_with_len(v.val.string.val, v.val.string.len); |
1768 | } |
1769 | else |
1770 | { |
1771 | /* Turn anything else into a json string */ |
1772 | StringInfo jtext = makeStringInfo(); |
1773 | Jsonb *jb = JsonbValueToJsonb(&v); |
1774 | |
1775 | (void) JsonbToCString(jtext, &jb->root, 0); |
1776 | sv = cstring_to_text_with_len(jtext->data, jtext->len); |
1777 | } |
1778 | |
1779 | values[1] = PointerGetDatum(sv); |
1780 | } |
1781 | } |
1782 | else |
1783 | { |
1784 | /* Not in text mode, just return the Jsonb */ |
1785 | Jsonb *val = JsonbValueToJsonb(&v); |
1786 | |
1787 | values[1] = PointerGetDatum(val); |
1788 | } |
1789 | |
1790 | tuple = heap_form_tuple(ret_tdesc, values, nulls); |
1791 | |
1792 | tuplestore_puttuple(tuple_store, tuple); |
1793 | |
1794 | /* clean up and switch back */ |
1795 | MemoryContextSwitchTo(old_cxt); |
1796 | MemoryContextReset(tmp_cxt); |
1797 | } |
1798 | } |
1799 | |
1800 | MemoryContextDelete(tmp_cxt); |
1801 | |
1802 | rsi->setResult = tuple_store; |
1803 | rsi->setDesc = ret_tdesc; |
1804 | |
1805 | PG_RETURN_NULL(); |
1806 | } |
1807 | |
1808 | |
1809 | static Datum |
1810 | each_worker(FunctionCallInfo fcinfo, bool as_text) |
1811 | { |
1812 | text *json = PG_GETARG_TEXT_PP(0); |
1813 | JsonLexContext *lex; |
1814 | JsonSemAction *sem; |
1815 | ReturnSetInfo *rsi; |
1816 | MemoryContext old_cxt; |
1817 | TupleDesc tupdesc; |
1818 | EachState *state; |
1819 | |
1820 | lex = makeJsonLexContext(json, true); |
1821 | state = palloc0(sizeof(EachState)); |
1822 | sem = palloc0(sizeof(JsonSemAction)); |
1823 | |
1824 | rsi = (ReturnSetInfo *) fcinfo->resultinfo; |
1825 | |
1826 | if (!rsi || !IsA(rsi, ReturnSetInfo) || |
1827 | (rsi->allowedModes & SFRM_Materialize) == 0 || |
1828 | rsi->expectedDesc == NULL) |
1829 | ereport(ERROR, |
1830 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
1831 | errmsg("set-valued function called in context that " |
1832 | "cannot accept a set" ))); |
1833 | |
1834 | rsi->returnMode = SFRM_Materialize; |
1835 | |
1836 | (void) get_call_result_type(fcinfo, NULL, &tupdesc); |
1837 | |
1838 | /* make these in a sufficiently long-lived memory context */ |
1839 | old_cxt = MemoryContextSwitchTo(rsi->econtext->ecxt_per_query_memory); |
1840 | |
1841 | state->ret_tdesc = CreateTupleDescCopy(tupdesc); |
1842 | BlessTupleDesc(state->ret_tdesc); |
1843 | state->tuple_store = |
1844 | tuplestore_begin_heap(rsi->allowedModes & SFRM_Materialize_Random, |
1845 | false, work_mem); |
1846 | |
1847 | MemoryContextSwitchTo(old_cxt); |
1848 | |
1849 | sem->semstate = (void *) state; |
1850 | sem->array_start = each_array_start; |
1851 | sem->scalar = each_scalar; |
1852 | sem->object_field_start = each_object_field_start; |
1853 | sem->object_field_end = each_object_field_end; |
1854 | |
1855 | state->normalize_results = as_text; |
1856 | state->next_scalar = false; |
1857 | state->lex = lex; |
1858 | state->tmp_cxt = AllocSetContextCreate(CurrentMemoryContext, |
1859 | "json_each temporary cxt" , |
1860 | ALLOCSET_DEFAULT_SIZES); |
1861 | |
1862 | pg_parse_json(lex, sem); |
1863 | |
1864 | MemoryContextDelete(state->tmp_cxt); |
1865 | |
1866 | rsi->setResult = state->tuple_store; |
1867 | rsi->setDesc = state->ret_tdesc; |
1868 | |
1869 | PG_RETURN_NULL(); |
1870 | } |
1871 | |
1872 | |
1873 | static void |
1874 | each_object_field_start(void *state, char *fname, bool isnull) |
1875 | { |
1876 | EachState *_state = (EachState *) state; |
1877 | |
1878 | /* save a pointer to where the value starts */ |
1879 | if (_state->lex->lex_level == 1) |
1880 | { |
1881 | /* |
1882 | * next_scalar will be reset in the object_field_end handler, and |
1883 | * since we know the value is a scalar there is no danger of it being |
1884 | * on while recursing down the tree. |
1885 | */ |
1886 | if (_state->normalize_results && _state->lex->token_type == JSON_TOKEN_STRING) |
1887 | _state->next_scalar = true; |
1888 | else |
1889 | _state->result_start = _state->lex->token_start; |
1890 | } |
1891 | } |
1892 | |
1893 | static void |
1894 | each_object_field_end(void *state, char *fname, bool isnull) |
1895 | { |
1896 | EachState *_state = (EachState *) state; |
1897 | MemoryContext old_cxt; |
1898 | int len; |
1899 | text *val; |
1900 | HeapTuple tuple; |
1901 | Datum values[2]; |
1902 | bool nulls[2] = {false, false}; |
1903 | |
1904 | /* skip over nested objects */ |
1905 | if (_state->lex->lex_level != 1) |
1906 | return; |
1907 | |
1908 | /* use the tmp context so we can clean up after each tuple is done */ |
1909 | old_cxt = MemoryContextSwitchTo(_state->tmp_cxt); |
1910 | |
1911 | values[0] = CStringGetTextDatum(fname); |
1912 | |
1913 | if (isnull && _state->normalize_results) |
1914 | { |
1915 | nulls[1] = true; |
1916 | values[1] = (Datum) 0; |
1917 | } |
1918 | else if (_state->next_scalar) |
1919 | { |
1920 | values[1] = CStringGetTextDatum(_state->normalized_scalar); |
1921 | _state->next_scalar = false; |
1922 | } |
1923 | else |
1924 | { |
1925 | len = _state->lex->prev_token_terminator - _state->result_start; |
1926 | val = cstring_to_text_with_len(_state->result_start, len); |
1927 | values[1] = PointerGetDatum(val); |
1928 | } |
1929 | |
1930 | tuple = heap_form_tuple(_state->ret_tdesc, values, nulls); |
1931 | |
1932 | tuplestore_puttuple(_state->tuple_store, tuple); |
1933 | |
1934 | /* clean up and switch back */ |
1935 | MemoryContextSwitchTo(old_cxt); |
1936 | MemoryContextReset(_state->tmp_cxt); |
1937 | } |
1938 | |
1939 | static void |
1940 | each_array_start(void *state) |
1941 | { |
1942 | EachState *_state = (EachState *) state; |
1943 | |
1944 | /* json structure check */ |
1945 | if (_state->lex->lex_level == 0) |
1946 | ereport(ERROR, |
1947 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1948 | errmsg("cannot deconstruct an array as an object" ))); |
1949 | } |
1950 | |
1951 | static void |
1952 | each_scalar(void *state, char *token, JsonTokenType tokentype) |
1953 | { |
1954 | EachState *_state = (EachState *) state; |
1955 | |
1956 | /* json structure check */ |
1957 | if (_state->lex->lex_level == 0) |
1958 | ereport(ERROR, |
1959 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
1960 | errmsg("cannot deconstruct a scalar" ))); |
1961 | |
1962 | /* supply de-escaped value if required */ |
1963 | if (_state->next_scalar) |
1964 | _state->normalized_scalar = token; |
1965 | } |
1966 | |
1967 | /* |
1968 | * SQL functions json_array_elements and json_array_elements_text |
1969 | * |
1970 | * get the elements from a json array |
1971 | * |
1972 | * a lot of this processing is similar to the json_each* functions |
1973 | */ |
1974 | |
1975 | Datum |
1976 | jsonb_array_elements(PG_FUNCTION_ARGS) |
1977 | { |
1978 | return elements_worker_jsonb(fcinfo, "jsonb_array_elements" , false); |
1979 | } |
1980 | |
1981 | Datum |
1982 | jsonb_array_elements_text(PG_FUNCTION_ARGS) |
1983 | { |
1984 | return elements_worker_jsonb(fcinfo, "jsonb_array_elements_text" , true); |
1985 | } |
1986 | |
1987 | static Datum |
1988 | elements_worker_jsonb(FunctionCallInfo fcinfo, const char *funcname, |
1989 | bool as_text) |
1990 | { |
1991 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
1992 | ReturnSetInfo *rsi; |
1993 | Tuplestorestate *tuple_store; |
1994 | TupleDesc tupdesc; |
1995 | TupleDesc ret_tdesc; |
1996 | MemoryContext old_cxt, |
1997 | tmp_cxt; |
1998 | bool skipNested = false; |
1999 | JsonbIterator *it; |
2000 | JsonbValue v; |
2001 | JsonbIteratorToken r; |
2002 | |
2003 | if (JB_ROOT_IS_SCALAR(jb)) |
2004 | ereport(ERROR, |
2005 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
2006 | errmsg("cannot extract elements from a scalar" ))); |
2007 | else if (!JB_ROOT_IS_ARRAY(jb)) |
2008 | ereport(ERROR, |
2009 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
2010 | errmsg("cannot extract elements from an object" ))); |
2011 | |
2012 | rsi = (ReturnSetInfo *) fcinfo->resultinfo; |
2013 | |
2014 | if (!rsi || !IsA(rsi, ReturnSetInfo) || |
2015 | (rsi->allowedModes & SFRM_Materialize) == 0 || |
2016 | rsi->expectedDesc == NULL) |
2017 | ereport(ERROR, |
2018 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
2019 | errmsg("set-valued function called in context that " |
2020 | "cannot accept a set" ))); |
2021 | |
2022 | rsi->returnMode = SFRM_Materialize; |
2023 | |
2024 | /* it's a simple type, so don't use get_call_result_type() */ |
2025 | tupdesc = rsi->expectedDesc; |
2026 | |
2027 | old_cxt = MemoryContextSwitchTo(rsi->econtext->ecxt_per_query_memory); |
2028 | |
2029 | ret_tdesc = CreateTupleDescCopy(tupdesc); |
2030 | BlessTupleDesc(ret_tdesc); |
2031 | tuple_store = |
2032 | tuplestore_begin_heap(rsi->allowedModes & SFRM_Materialize_Random, |
2033 | false, work_mem); |
2034 | |
2035 | MemoryContextSwitchTo(old_cxt); |
2036 | |
2037 | tmp_cxt = AllocSetContextCreate(CurrentMemoryContext, |
2038 | "jsonb_array_elements temporary cxt" , |
2039 | ALLOCSET_DEFAULT_SIZES); |
2040 | |
2041 | it = JsonbIteratorInit(&jb->root); |
2042 | |
2043 | while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE) |
2044 | { |
2045 | skipNested = true; |
2046 | |
2047 | if (r == WJB_ELEM) |
2048 | { |
2049 | HeapTuple tuple; |
2050 | Datum values[1]; |
2051 | bool nulls[1] = {false}; |
2052 | |
2053 | /* use the tmp context so we can clean up after each tuple is done */ |
2054 | old_cxt = MemoryContextSwitchTo(tmp_cxt); |
2055 | |
2056 | if (!as_text) |
2057 | { |
2058 | Jsonb *val = JsonbValueToJsonb(&v); |
2059 | |
2060 | values[0] = PointerGetDatum(val); |
2061 | } |
2062 | else |
2063 | { |
2064 | if (v.type == jbvNull) |
2065 | { |
2066 | /* a json null is an sql null in text mode */ |
2067 | nulls[0] = true; |
2068 | values[0] = (Datum) NULL; |
2069 | } |
2070 | else |
2071 | { |
2072 | text *sv; |
2073 | |
2074 | if (v.type == jbvString) |
2075 | { |
2076 | /* in text mode scalar strings should be dequoted */ |
2077 | sv = cstring_to_text_with_len(v.val.string.val, v.val.string.len); |
2078 | } |
2079 | else |
2080 | { |
2081 | /* turn anything else into a json string */ |
2082 | StringInfo jtext = makeStringInfo(); |
2083 | Jsonb *jb = JsonbValueToJsonb(&v); |
2084 | |
2085 | (void) JsonbToCString(jtext, &jb->root, 0); |
2086 | sv = cstring_to_text_with_len(jtext->data, jtext->len); |
2087 | } |
2088 | |
2089 | values[0] = PointerGetDatum(sv); |
2090 | } |
2091 | } |
2092 | |
2093 | tuple = heap_form_tuple(ret_tdesc, values, nulls); |
2094 | |
2095 | tuplestore_puttuple(tuple_store, tuple); |
2096 | |
2097 | /* clean up and switch back */ |
2098 | MemoryContextSwitchTo(old_cxt); |
2099 | MemoryContextReset(tmp_cxt); |
2100 | } |
2101 | } |
2102 | |
2103 | MemoryContextDelete(tmp_cxt); |
2104 | |
2105 | rsi->setResult = tuple_store; |
2106 | rsi->setDesc = ret_tdesc; |
2107 | |
2108 | PG_RETURN_NULL(); |
2109 | } |
2110 | |
2111 | Datum |
2112 | json_array_elements(PG_FUNCTION_ARGS) |
2113 | { |
2114 | return elements_worker(fcinfo, "json_array_elements" , false); |
2115 | } |
2116 | |
2117 | Datum |
2118 | json_array_elements_text(PG_FUNCTION_ARGS) |
2119 | { |
2120 | return elements_worker(fcinfo, "json_array_elements_text" , true); |
2121 | } |
2122 | |
2123 | static Datum |
2124 | elements_worker(FunctionCallInfo fcinfo, const char *funcname, bool as_text) |
2125 | { |
2126 | text *json = PG_GETARG_TEXT_PP(0); |
2127 | |
2128 | /* elements only needs escaped strings when as_text */ |
2129 | JsonLexContext *lex = makeJsonLexContext(json, as_text); |
2130 | JsonSemAction *sem; |
2131 | ReturnSetInfo *rsi; |
2132 | MemoryContext old_cxt; |
2133 | TupleDesc tupdesc; |
2134 | ElementsState *state; |
2135 | |
2136 | state = palloc0(sizeof(ElementsState)); |
2137 | sem = palloc0(sizeof(JsonSemAction)); |
2138 | |
2139 | rsi = (ReturnSetInfo *) fcinfo->resultinfo; |
2140 | |
2141 | if (!rsi || !IsA(rsi, ReturnSetInfo) || |
2142 | (rsi->allowedModes & SFRM_Materialize) == 0 || |
2143 | rsi->expectedDesc == NULL) |
2144 | ereport(ERROR, |
2145 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
2146 | errmsg("set-valued function called in context that " |
2147 | "cannot accept a set" ))); |
2148 | |
2149 | rsi->returnMode = SFRM_Materialize; |
2150 | |
2151 | /* it's a simple type, so don't use get_call_result_type() */ |
2152 | tupdesc = rsi->expectedDesc; |
2153 | |
2154 | /* make these in a sufficiently long-lived memory context */ |
2155 | old_cxt = MemoryContextSwitchTo(rsi->econtext->ecxt_per_query_memory); |
2156 | |
2157 | state->ret_tdesc = CreateTupleDescCopy(tupdesc); |
2158 | BlessTupleDesc(state->ret_tdesc); |
2159 | state->tuple_store = |
2160 | tuplestore_begin_heap(rsi->allowedModes & SFRM_Materialize_Random, |
2161 | false, work_mem); |
2162 | |
2163 | MemoryContextSwitchTo(old_cxt); |
2164 | |
2165 | sem->semstate = (void *) state; |
2166 | sem->object_start = elements_object_start; |
2167 | sem->scalar = elements_scalar; |
2168 | sem->array_element_start = elements_array_element_start; |
2169 | sem->array_element_end = elements_array_element_end; |
2170 | |
2171 | state->function_name = funcname; |
2172 | state->normalize_results = as_text; |
2173 | state->next_scalar = false; |
2174 | state->lex = lex; |
2175 | state->tmp_cxt = AllocSetContextCreate(CurrentMemoryContext, |
2176 | "json_array_elements temporary cxt" , |
2177 | ALLOCSET_DEFAULT_SIZES); |
2178 | |
2179 | pg_parse_json(lex, sem); |
2180 | |
2181 | MemoryContextDelete(state->tmp_cxt); |
2182 | |
2183 | rsi->setResult = state->tuple_store; |
2184 | rsi->setDesc = state->ret_tdesc; |
2185 | |
2186 | PG_RETURN_NULL(); |
2187 | } |
2188 | |
2189 | static void |
2190 | elements_array_element_start(void *state, bool isnull) |
2191 | { |
2192 | ElementsState *_state = (ElementsState *) state; |
2193 | |
2194 | /* save a pointer to where the value starts */ |
2195 | if (_state->lex->lex_level == 1) |
2196 | { |
2197 | /* |
2198 | * next_scalar will be reset in the array_element_end handler, and |
2199 | * since we know the value is a scalar there is no danger of it being |
2200 | * on while recursing down the tree. |
2201 | */ |
2202 | if (_state->normalize_results && _state->lex->token_type == JSON_TOKEN_STRING) |
2203 | _state->next_scalar = true; |
2204 | else |
2205 | _state->result_start = _state->lex->token_start; |
2206 | } |
2207 | } |
2208 | |
2209 | static void |
2210 | elements_array_element_end(void *state, bool isnull) |
2211 | { |
2212 | ElementsState *_state = (ElementsState *) state; |
2213 | MemoryContext old_cxt; |
2214 | int len; |
2215 | text *val; |
2216 | HeapTuple tuple; |
2217 | Datum values[1]; |
2218 | bool nulls[1] = {false}; |
2219 | |
2220 | /* skip over nested objects */ |
2221 | if (_state->lex->lex_level != 1) |
2222 | return; |
2223 | |
2224 | /* use the tmp context so we can clean up after each tuple is done */ |
2225 | old_cxt = MemoryContextSwitchTo(_state->tmp_cxt); |
2226 | |
2227 | if (isnull && _state->normalize_results) |
2228 | { |
2229 | nulls[0] = true; |
2230 | values[0] = (Datum) NULL; |
2231 | } |
2232 | else if (_state->next_scalar) |
2233 | { |
2234 | values[0] = CStringGetTextDatum(_state->normalized_scalar); |
2235 | _state->next_scalar = false; |
2236 | } |
2237 | else |
2238 | { |
2239 | len = _state->lex->prev_token_terminator - _state->result_start; |
2240 | val = cstring_to_text_with_len(_state->result_start, len); |
2241 | values[0] = PointerGetDatum(val); |
2242 | } |
2243 | |
2244 | tuple = heap_form_tuple(_state->ret_tdesc, values, nulls); |
2245 | |
2246 | tuplestore_puttuple(_state->tuple_store, tuple); |
2247 | |
2248 | /* clean up and switch back */ |
2249 | MemoryContextSwitchTo(old_cxt); |
2250 | MemoryContextReset(_state->tmp_cxt); |
2251 | } |
2252 | |
2253 | static void |
2254 | elements_object_start(void *state) |
2255 | { |
2256 | ElementsState *_state = (ElementsState *) state; |
2257 | |
2258 | /* json structure check */ |
2259 | if (_state->lex->lex_level == 0) |
2260 | ereport(ERROR, |
2261 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
2262 | errmsg("cannot call %s on a non-array" , |
2263 | _state->function_name))); |
2264 | } |
2265 | |
2266 | static void |
2267 | elements_scalar(void *state, char *token, JsonTokenType tokentype) |
2268 | { |
2269 | ElementsState *_state = (ElementsState *) state; |
2270 | |
2271 | /* json structure check */ |
2272 | if (_state->lex->lex_level == 0) |
2273 | ereport(ERROR, |
2274 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
2275 | errmsg("cannot call %s on a scalar" , |
2276 | _state->function_name))); |
2277 | |
2278 | /* supply de-escaped value if required */ |
2279 | if (_state->next_scalar) |
2280 | _state->normalized_scalar = token; |
2281 | } |
2282 | |
2283 | /* |
2284 | * SQL function json_populate_record |
2285 | * |
2286 | * set fields in a record from the argument json |
2287 | * |
2288 | * Code adapted shamelessly from hstore's populate_record |
2289 | * which is in turn partly adapted from record_out. |
2290 | * |
2291 | * The json is decomposed into a hash table, in which each |
2292 | * field in the record is then looked up by name. For jsonb |
2293 | * we fetch the values direct from the object. |
2294 | */ |
2295 | Datum |
2296 | jsonb_populate_record(PG_FUNCTION_ARGS) |
2297 | { |
2298 | return populate_record_worker(fcinfo, "jsonb_populate_record" , |
2299 | false, true); |
2300 | } |
2301 | |
2302 | Datum |
2303 | jsonb_to_record(PG_FUNCTION_ARGS) |
2304 | { |
2305 | return populate_record_worker(fcinfo, "jsonb_to_record" , |
2306 | false, false); |
2307 | } |
2308 | |
2309 | Datum |
2310 | json_populate_record(PG_FUNCTION_ARGS) |
2311 | { |
2312 | return populate_record_worker(fcinfo, "json_populate_record" , |
2313 | true, true); |
2314 | } |
2315 | |
2316 | Datum |
2317 | json_to_record(PG_FUNCTION_ARGS) |
2318 | { |
2319 | return populate_record_worker(fcinfo, "json_to_record" , |
2320 | true, false); |
2321 | } |
2322 | |
2323 | /* helper function for diagnostics */ |
2324 | static void |
2325 | populate_array_report_expected_array(PopulateArrayContext *ctx, int ndim) |
2326 | { |
2327 | if (ndim <= 0) |
2328 | { |
2329 | if (ctx->colname) |
2330 | ereport(ERROR, |
2331 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
2332 | errmsg("expected JSON array" ), |
2333 | errhint("See the value of key \"%s\"." , ctx->colname))); |
2334 | else |
2335 | ereport(ERROR, |
2336 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
2337 | errmsg("expected JSON array" ))); |
2338 | } |
2339 | else |
2340 | { |
2341 | StringInfoData indices; |
2342 | int i; |
2343 | |
2344 | initStringInfo(&indices); |
2345 | |
2346 | Assert(ctx->ndims > 0 && ndim < ctx->ndims); |
2347 | |
2348 | for (i = 0; i < ndim; i++) |
2349 | appendStringInfo(&indices, "[%d]" , ctx->sizes[i]); |
2350 | |
2351 | if (ctx->colname) |
2352 | ereport(ERROR, |
2353 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
2354 | errmsg("expected JSON array" ), |
2355 | errhint("See the array element %s of key \"%s\"." , |
2356 | indices.data, ctx->colname))); |
2357 | else |
2358 | ereport(ERROR, |
2359 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
2360 | errmsg("expected JSON array" ), |
2361 | errhint("See the array element %s." , |
2362 | indices.data))); |
2363 | } |
2364 | } |
2365 | |
2366 | /* set the number of dimensions of the populated array when it becomes known */ |
2367 | static void |
2368 | populate_array_assign_ndims(PopulateArrayContext *ctx, int ndims) |
2369 | { |
2370 | int i; |
2371 | |
2372 | Assert(ctx->ndims <= 0); |
2373 | |
2374 | if (ndims <= 0) |
2375 | populate_array_report_expected_array(ctx, ndims); |
2376 | |
2377 | ctx->ndims = ndims; |
2378 | ctx->dims = palloc(sizeof(int) * ndims); |
2379 | ctx->sizes = palloc0(sizeof(int) * ndims); |
2380 | |
2381 | for (i = 0; i < ndims; i++) |
2382 | ctx->dims[i] = -1; /* dimensions are unknown yet */ |
2383 | } |
2384 | |
2385 | /* check the populated subarray dimension */ |
2386 | static void |
2387 | populate_array_check_dimension(PopulateArrayContext *ctx, int ndim) |
2388 | { |
2389 | int dim = ctx->sizes[ndim]; /* current dimension counter */ |
2390 | |
2391 | if (ctx->dims[ndim] == -1) |
2392 | ctx->dims[ndim] = dim; /* assign dimension if not yet known */ |
2393 | else if (ctx->dims[ndim] != dim) |
2394 | ereport(ERROR, |
2395 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
2396 | errmsg("malformed JSON array" ), |
2397 | errdetail("Multidimensional arrays must have " |
2398 | "sub-arrays with matching dimensions." ))); |
2399 | |
2400 | /* reset the current array dimension size counter */ |
2401 | ctx->sizes[ndim] = 0; |
2402 | |
2403 | /* increment the parent dimension counter if it is a nested sub-array */ |
2404 | if (ndim > 0) |
2405 | ctx->sizes[ndim - 1]++; |
2406 | } |
2407 | |
2408 | static void |
2409 | populate_array_element(PopulateArrayContext *ctx, int ndim, JsValue *jsv) |
2410 | { |
2411 | Datum element; |
2412 | bool element_isnull; |
2413 | |
2414 | /* populate the array element */ |
2415 | element = populate_record_field(ctx->aio->element_info, |
2416 | ctx->aio->element_type, |
2417 | ctx->aio->element_typmod, |
2418 | NULL, ctx->mcxt, PointerGetDatum(NULL), |
2419 | jsv, &element_isnull); |
2420 | |
2421 | accumArrayResult(ctx->astate, element, element_isnull, |
2422 | ctx->aio->element_type, ctx->acxt); |
2423 | |
2424 | Assert(ndim > 0); |
2425 | ctx->sizes[ndim - 1]++; /* increment current dimension counter */ |
2426 | } |
2427 | |
2428 | /* json object start handler for populate_array_json() */ |
2429 | static void |
2430 | populate_array_object_start(void *_state) |
2431 | { |
2432 | PopulateArrayState *state = (PopulateArrayState *) _state; |
2433 | int ndim = state->lex->lex_level; |
2434 | |
2435 | if (state->ctx->ndims <= 0) |
2436 | populate_array_assign_ndims(state->ctx, ndim); |
2437 | else if (ndim < state->ctx->ndims) |
2438 | populate_array_report_expected_array(state->ctx, ndim); |
2439 | } |
2440 | |
2441 | /* json array end handler for populate_array_json() */ |
2442 | static void |
2443 | populate_array_array_end(void *_state) |
2444 | { |
2445 | PopulateArrayState *state = (PopulateArrayState *) _state; |
2446 | PopulateArrayContext *ctx = state->ctx; |
2447 | int ndim = state->lex->lex_level; |
2448 | |
2449 | if (ctx->ndims <= 0) |
2450 | populate_array_assign_ndims(ctx, ndim + 1); |
2451 | |
2452 | if (ndim < ctx->ndims) |
2453 | populate_array_check_dimension(ctx, ndim); |
2454 | } |
2455 | |
2456 | /* json array element start handler for populate_array_json() */ |
2457 | static void |
2458 | populate_array_element_start(void *_state, bool isnull) |
2459 | { |
2460 | PopulateArrayState *state = (PopulateArrayState *) _state; |
2461 | int ndim = state->lex->lex_level; |
2462 | |
2463 | if (state->ctx->ndims <= 0 || ndim == state->ctx->ndims) |
2464 | { |
2465 | /* remember current array element start */ |
2466 | state->element_start = state->lex->token_start; |
2467 | state->element_type = state->lex->token_type; |
2468 | state->element_scalar = NULL; |
2469 | } |
2470 | } |
2471 | |
2472 | /* json array element end handler for populate_array_json() */ |
2473 | static void |
2474 | populate_array_element_end(void *_state, bool isnull) |
2475 | { |
2476 | PopulateArrayState *state = (PopulateArrayState *) _state; |
2477 | PopulateArrayContext *ctx = state->ctx; |
2478 | int ndim = state->lex->lex_level; |
2479 | |
2480 | Assert(ctx->ndims > 0); |
2481 | |
2482 | if (ndim == ctx->ndims) |
2483 | { |
2484 | JsValue jsv; |
2485 | |
2486 | jsv.is_json = true; |
2487 | jsv.val.json.type = state->element_type; |
2488 | |
2489 | if (isnull) |
2490 | { |
2491 | Assert(jsv.val.json.type == JSON_TOKEN_NULL); |
2492 | jsv.val.json.str = NULL; |
2493 | jsv.val.json.len = 0; |
2494 | } |
2495 | else if (state->element_scalar) |
2496 | { |
2497 | jsv.val.json.str = state->element_scalar; |
2498 | jsv.val.json.len = -1; /* null-terminated */ |
2499 | } |
2500 | else |
2501 | { |
2502 | jsv.val.json.str = state->element_start; |
2503 | jsv.val.json.len = (state->lex->prev_token_terminator - |
2504 | state->element_start) * sizeof(char); |
2505 | } |
2506 | |
2507 | populate_array_element(ctx, ndim, &jsv); |
2508 | } |
2509 | } |
2510 | |
2511 | /* json scalar handler for populate_array_json() */ |
2512 | static void |
2513 | populate_array_scalar(void *_state, char *token, JsonTokenType tokentype) |
2514 | { |
2515 | PopulateArrayState *state = (PopulateArrayState *) _state; |
2516 | PopulateArrayContext *ctx = state->ctx; |
2517 | int ndim = state->lex->lex_level; |
2518 | |
2519 | if (ctx->ndims <= 0) |
2520 | populate_array_assign_ndims(ctx, ndim); |
2521 | else if (ndim < ctx->ndims) |
2522 | populate_array_report_expected_array(ctx, ndim); |
2523 | |
2524 | if (ndim == ctx->ndims) |
2525 | { |
2526 | /* remember the scalar element token */ |
2527 | state->element_scalar = token; |
2528 | /* element_type must already be set in populate_array_element_start() */ |
2529 | Assert(state->element_type == tokentype); |
2530 | } |
2531 | } |
2532 | |
2533 | /* parse a json array and populate array */ |
2534 | static void |
2535 | populate_array_json(PopulateArrayContext *ctx, char *json, int len) |
2536 | { |
2537 | PopulateArrayState state; |
2538 | JsonSemAction sem; |
2539 | |
2540 | state.lex = makeJsonLexContextCstringLen(json, len, true); |
2541 | state.ctx = ctx; |
2542 | |
2543 | memset(&sem, 0, sizeof(sem)); |
2544 | sem.semstate = (void *) &state; |
2545 | sem.object_start = populate_array_object_start; |
2546 | sem.array_end = populate_array_array_end; |
2547 | sem.array_element_start = populate_array_element_start; |
2548 | sem.array_element_end = populate_array_element_end; |
2549 | sem.scalar = populate_array_scalar; |
2550 | |
2551 | pg_parse_json(state.lex, &sem); |
2552 | |
2553 | /* number of dimensions should be already known */ |
2554 | Assert(ctx->ndims > 0 && ctx->dims); |
2555 | |
2556 | pfree(state.lex); |
2557 | } |
2558 | |
2559 | /* |
2560 | * populate_array_dim_jsonb() -- Iterate recursively through jsonb sub-array |
2561 | * elements and accumulate result using given ArrayBuildState. |
2562 | */ |
2563 | static void |
2564 | populate_array_dim_jsonb(PopulateArrayContext *ctx, /* context */ |
2565 | JsonbValue *jbv, /* jsonb sub-array */ |
2566 | int ndim) /* current dimension */ |
2567 | { |
2568 | JsonbContainer *jbc = jbv->val.binary.data; |
2569 | JsonbIterator *it; |
2570 | JsonbIteratorToken tok; |
2571 | JsonbValue val; |
2572 | JsValue jsv; |
2573 | |
2574 | check_stack_depth(); |
2575 | |
2576 | if (jbv->type != jbvBinary || !JsonContainerIsArray(jbc)) |
2577 | populate_array_report_expected_array(ctx, ndim - 1); |
2578 | |
2579 | Assert(!JsonContainerIsScalar(jbc)); |
2580 | |
2581 | it = JsonbIteratorInit(jbc); |
2582 | |
2583 | tok = JsonbIteratorNext(&it, &val, true); |
2584 | Assert(tok == WJB_BEGIN_ARRAY); |
2585 | |
2586 | tok = JsonbIteratorNext(&it, &val, true); |
2587 | |
2588 | /* |
2589 | * If the number of dimensions is not yet known and we have found end of |
2590 | * the array, or the first child element is not an array, then assign the |
2591 | * number of dimensions now. |
2592 | */ |
2593 | if (ctx->ndims <= 0 && |
2594 | (tok == WJB_END_ARRAY || |
2595 | (tok == WJB_ELEM && |
2596 | (val.type != jbvBinary || |
2597 | !JsonContainerIsArray(val.val.binary.data))))) |
2598 | populate_array_assign_ndims(ctx, ndim); |
2599 | |
2600 | jsv.is_json = false; |
2601 | jsv.val.jsonb = &val; |
2602 | |
2603 | /* process all the array elements */ |
2604 | while (tok == WJB_ELEM) |
2605 | { |
2606 | /* |
2607 | * Recurse only if the dimensions of dimensions is still unknown or if |
2608 | * it is not the innermost dimension. |
2609 | */ |
2610 | if (ctx->ndims > 0 && ndim >= ctx->ndims) |
2611 | populate_array_element(ctx, ndim, &jsv); |
2612 | else |
2613 | { |
2614 | /* populate child sub-array */ |
2615 | populate_array_dim_jsonb(ctx, &val, ndim + 1); |
2616 | |
2617 | /* number of dimensions should be already known */ |
2618 | Assert(ctx->ndims > 0 && ctx->dims); |
2619 | |
2620 | populate_array_check_dimension(ctx, ndim); |
2621 | } |
2622 | |
2623 | tok = JsonbIteratorNext(&it, &val, true); |
2624 | } |
2625 | |
2626 | Assert(tok == WJB_END_ARRAY); |
2627 | |
2628 | /* free iterator, iterating until WJB_DONE */ |
2629 | tok = JsonbIteratorNext(&it, &val, true); |
2630 | Assert(tok == WJB_DONE && !it); |
2631 | } |
2632 | |
2633 | /* recursively populate an array from json/jsonb */ |
2634 | static Datum |
2635 | populate_array(ArrayIOData *aio, |
2636 | const char *colname, |
2637 | MemoryContext mcxt, |
2638 | JsValue *jsv) |
2639 | { |
2640 | PopulateArrayContext ctx; |
2641 | Datum result; |
2642 | int *lbs; |
2643 | int i; |
2644 | |
2645 | ctx.aio = aio; |
2646 | ctx.mcxt = mcxt; |
2647 | ctx.acxt = CurrentMemoryContext; |
2648 | ctx.astate = initArrayResult(aio->element_type, ctx.acxt, true); |
2649 | ctx.colname = colname; |
2650 | ctx.ndims = 0; /* unknown yet */ |
2651 | ctx.dims = NULL; |
2652 | ctx.sizes = NULL; |
2653 | |
2654 | if (jsv->is_json) |
2655 | populate_array_json(&ctx, jsv->val.json.str, |
2656 | jsv->val.json.len >= 0 ? jsv->val.json.len |
2657 | : strlen(jsv->val.json.str)); |
2658 | else |
2659 | { |
2660 | populate_array_dim_jsonb(&ctx, jsv->val.jsonb, 1); |
2661 | ctx.dims[0] = ctx.sizes[0]; |
2662 | } |
2663 | |
2664 | Assert(ctx.ndims > 0); |
2665 | |
2666 | lbs = palloc(sizeof(int) * ctx.ndims); |
2667 | |
2668 | for (i = 0; i < ctx.ndims; i++) |
2669 | lbs[i] = 1; |
2670 | |
2671 | result = makeMdArrayResult(ctx.astate, ctx.ndims, ctx.dims, lbs, |
2672 | ctx.acxt, true); |
2673 | |
2674 | pfree(ctx.dims); |
2675 | pfree(ctx.sizes); |
2676 | pfree(lbs); |
2677 | |
2678 | return result; |
2679 | } |
2680 | |
2681 | static void |
2682 | JsValueToJsObject(JsValue *jsv, JsObject *jso) |
2683 | { |
2684 | jso->is_json = jsv->is_json; |
2685 | |
2686 | if (jsv->is_json) |
2687 | { |
2688 | /* convert plain-text json into a hash table */ |
2689 | jso->val.json_hash = |
2690 | get_json_object_as_hash(jsv->val.json.str, |
2691 | jsv->val.json.len >= 0 |
2692 | ? jsv->val.json.len |
2693 | : strlen(jsv->val.json.str), |
2694 | "populate_composite" ); |
2695 | } |
2696 | else |
2697 | { |
2698 | JsonbValue *jbv = jsv->val.jsonb; |
2699 | |
2700 | if (jbv->type == jbvBinary && |
2701 | JsonContainerIsObject(jbv->val.binary.data)) |
2702 | { |
2703 | jso->val.jsonb_cont = jbv->val.binary.data; |
2704 | } |
2705 | else |
2706 | { |
2707 | bool is_scalar; |
2708 | |
2709 | is_scalar = IsAJsonbScalar(jbv) || |
2710 | (jbv->type == jbvBinary && |
2711 | JsonContainerIsScalar(jbv->val.binary.data)); |
2712 | ereport(ERROR, |
2713 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
2714 | is_scalar |
2715 | ? errmsg("cannot call %s on a scalar" , |
2716 | "populate_composite" ) |
2717 | : errmsg("cannot call %s on an array" , |
2718 | "populate_composite" ))); |
2719 | } |
2720 | } |
2721 | } |
2722 | |
2723 | /* acquire or update cached tuple descriptor for a composite type */ |
2724 | static void |
2725 | update_cached_tupdesc(CompositeIOData *io, MemoryContext mcxt) |
2726 | { |
2727 | if (!io->tupdesc || |
2728 | io->tupdesc->tdtypeid != io->base_typid || |
2729 | io->tupdesc->tdtypmod != io->base_typmod) |
2730 | { |
2731 | TupleDesc tupdesc = lookup_rowtype_tupdesc(io->base_typid, |
2732 | io->base_typmod); |
2733 | MemoryContext oldcxt; |
2734 | |
2735 | if (io->tupdesc) |
2736 | FreeTupleDesc(io->tupdesc); |
2737 | |
2738 | /* copy tuple desc without constraints into cache memory context */ |
2739 | oldcxt = MemoryContextSwitchTo(mcxt); |
2740 | io->tupdesc = CreateTupleDescCopy(tupdesc); |
2741 | MemoryContextSwitchTo(oldcxt); |
2742 | |
2743 | ReleaseTupleDesc(tupdesc); |
2744 | } |
2745 | } |
2746 | |
2747 | /* recursively populate a composite (row type) value from json/jsonb */ |
2748 | static Datum |
2749 | populate_composite(CompositeIOData *io, |
2750 | Oid typid, |
2751 | const char *colname, |
2752 | MemoryContext mcxt, |
2753 | HeapTupleHeader defaultval, |
2754 | JsValue *jsv, |
2755 | bool isnull) |
2756 | { |
2757 | Datum result; |
2758 | |
2759 | /* acquire/update cached tuple descriptor */ |
2760 | update_cached_tupdesc(io, mcxt); |
2761 | |
2762 | if (isnull) |
2763 | result = (Datum) 0; |
2764 | else |
2765 | { |
2766 | HeapTupleHeader tuple; |
2767 | JsObject jso; |
2768 | |
2769 | /* prepare input value */ |
2770 | JsValueToJsObject(jsv, &jso); |
2771 | |
2772 | /* populate resulting record tuple */ |
2773 | tuple = populate_record(io->tupdesc, &io->record_io, |
2774 | defaultval, mcxt, &jso); |
2775 | result = HeapTupleHeaderGetDatum(tuple); |
2776 | |
2777 | JsObjectFree(&jso); |
2778 | } |
2779 | |
2780 | /* |
2781 | * If it's domain over composite, check domain constraints. (This should |
2782 | * probably get refactored so that we can see the TYPECAT value, but for |
2783 | * now, we can tell by comparing typid to base_typid.) |
2784 | */ |
2785 | if (typid != io->base_typid && typid != RECORDOID) |
2786 | domain_check(result, isnull, typid, &io->domain_info, mcxt); |
2787 | |
2788 | return result; |
2789 | } |
2790 | |
2791 | /* populate non-null scalar value from json/jsonb value */ |
2792 | static Datum |
2793 | populate_scalar(ScalarIOData *io, Oid typid, int32 typmod, JsValue *jsv) |
2794 | { |
2795 | Datum res; |
2796 | char *str = NULL; |
2797 | char *json = NULL; |
2798 | |
2799 | if (jsv->is_json) |
2800 | { |
2801 | int len = jsv->val.json.len; |
2802 | |
2803 | json = jsv->val.json.str; |
2804 | Assert(json); |
2805 | if (len >= 0) |
2806 | { |
2807 | /* Need to copy non-null-terminated string */ |
2808 | str = palloc(len + 1 * sizeof(char)); |
2809 | memcpy(str, json, len); |
2810 | str[len] = '\0'; |
2811 | } |
2812 | else |
2813 | str = json; /* string is already null-terminated */ |
2814 | |
2815 | /* If converting to json/jsonb, make string into valid JSON literal */ |
2816 | if ((typid == JSONOID || typid == JSONBOID) && |
2817 | jsv->val.json.type == JSON_TOKEN_STRING) |
2818 | { |
2819 | StringInfoData buf; |
2820 | |
2821 | initStringInfo(&buf); |
2822 | escape_json(&buf, str); |
2823 | /* free temporary buffer */ |
2824 | if (str != json) |
2825 | pfree(str); |
2826 | str = buf.data; |
2827 | } |
2828 | } |
2829 | else |
2830 | { |
2831 | JsonbValue *jbv = jsv->val.jsonb; |
2832 | |
2833 | if (typid == JSONBOID) |
2834 | { |
2835 | Jsonb *jsonb = JsonbValueToJsonb(jbv); /* directly use jsonb */ |
2836 | |
2837 | return JsonbPGetDatum(jsonb); |
2838 | } |
2839 | /* convert jsonb to string for typio call */ |
2840 | else if (typid == JSONOID && jbv->type != jbvBinary) |
2841 | { |
2842 | /* |
2843 | * Convert scalar jsonb (non-scalars are passed here as jbvBinary) |
2844 | * to json string, preserving quotes around top-level strings. |
2845 | */ |
2846 | Jsonb *jsonb = JsonbValueToJsonb(jbv); |
2847 | |
2848 | str = JsonbToCString(NULL, &jsonb->root, VARSIZE(jsonb)); |
2849 | } |
2850 | else if (jbv->type == jbvString) /* quotes are stripped */ |
2851 | str = pnstrdup(jbv->val.string.val, jbv->val.string.len); |
2852 | else if (jbv->type == jbvBool) |
2853 | str = pstrdup(jbv->val.boolean ? "true" : "false" ); |
2854 | else if (jbv->type == jbvNumeric) |
2855 | str = DatumGetCString(DirectFunctionCall1(numeric_out, |
2856 | PointerGetDatum(jbv->val.numeric))); |
2857 | else if (jbv->type == jbvBinary) |
2858 | str = JsonbToCString(NULL, jbv->val.binary.data, |
2859 | jbv->val.binary.len); |
2860 | else |
2861 | elog(ERROR, "unrecognized jsonb type: %d" , (int) jbv->type); |
2862 | } |
2863 | |
2864 | res = InputFunctionCall(&io->typiofunc, str, io->typioparam, typmod); |
2865 | |
2866 | /* free temporary buffer */ |
2867 | if (str != json) |
2868 | pfree(str); |
2869 | |
2870 | return res; |
2871 | } |
2872 | |
2873 | static Datum |
2874 | populate_domain(DomainIOData *io, |
2875 | Oid typid, |
2876 | const char *colname, |
2877 | MemoryContext mcxt, |
2878 | JsValue *jsv, |
2879 | bool isnull) |
2880 | { |
2881 | Datum res; |
2882 | |
2883 | if (isnull) |
2884 | res = (Datum) 0; |
2885 | else |
2886 | { |
2887 | res = populate_record_field(io->base_io, |
2888 | io->base_typid, io->base_typmod, |
2889 | colname, mcxt, PointerGetDatum(NULL), |
2890 | jsv, &isnull); |
2891 | Assert(!isnull); |
2892 | } |
2893 | |
2894 | domain_check(res, isnull, typid, &io->domain_info, mcxt); |
2895 | |
2896 | return res; |
2897 | } |
2898 | |
2899 | /* prepare column metadata cache for the given type */ |
2900 | static void |
2901 | prepare_column_cache(ColumnIOData *column, |
2902 | Oid typid, |
2903 | int32 typmod, |
2904 | MemoryContext mcxt, |
2905 | bool need_scalar) |
2906 | { |
2907 | HeapTuple tup; |
2908 | Form_pg_type type; |
2909 | |
2910 | column->typid = typid; |
2911 | column->typmod = typmod; |
2912 | |
2913 | tup = SearchSysCache1(TYPEOID, ObjectIdGetDatum(typid)); |
2914 | if (!HeapTupleIsValid(tup)) |
2915 | elog(ERROR, "cache lookup failed for type %u" , typid); |
2916 | |
2917 | type = (Form_pg_type) GETSTRUCT(tup); |
2918 | |
2919 | if (type->typtype == TYPTYPE_DOMAIN) |
2920 | { |
2921 | /* |
2922 | * We can move directly to the bottom base type; domain_check() will |
2923 | * take care of checking all constraints for a stack of domains. |
2924 | */ |
2925 | Oid base_typid; |
2926 | int32 base_typmod = typmod; |
2927 | |
2928 | base_typid = getBaseTypeAndTypmod(typid, &base_typmod); |
2929 | if (get_typtype(base_typid) == TYPTYPE_COMPOSITE) |
2930 | { |
2931 | /* domain over composite has its own code path */ |
2932 | column->typcat = TYPECAT_COMPOSITE_DOMAIN; |
2933 | column->io.composite.record_io = NULL; |
2934 | column->io.composite.tupdesc = NULL; |
2935 | column->io.composite.base_typid = base_typid; |
2936 | column->io.composite.base_typmod = base_typmod; |
2937 | column->io.composite.domain_info = NULL; |
2938 | } |
2939 | else |
2940 | { |
2941 | /* domain over anything else */ |
2942 | column->typcat = TYPECAT_DOMAIN; |
2943 | column->io.domain.base_typid = base_typid; |
2944 | column->io.domain.base_typmod = base_typmod; |
2945 | column->io.domain.base_io = |
2946 | MemoryContextAllocZero(mcxt, sizeof(ColumnIOData)); |
2947 | column->io.domain.domain_info = NULL; |
2948 | } |
2949 | } |
2950 | else if (type->typtype == TYPTYPE_COMPOSITE || typid == RECORDOID) |
2951 | { |
2952 | column->typcat = TYPECAT_COMPOSITE; |
2953 | column->io.composite.record_io = NULL; |
2954 | column->io.composite.tupdesc = NULL; |
2955 | column->io.composite.base_typid = typid; |
2956 | column->io.composite.base_typmod = typmod; |
2957 | column->io.composite.domain_info = NULL; |
2958 | } |
2959 | else if (type->typlen == -1 && OidIsValid(type->typelem)) |
2960 | { |
2961 | column->typcat = TYPECAT_ARRAY; |
2962 | column->io.array.element_info = MemoryContextAllocZero(mcxt, |
2963 | sizeof(ColumnIOData)); |
2964 | column->io.array.element_type = type->typelem; |
2965 | /* array element typemod stored in attribute's typmod */ |
2966 | column->io.array.element_typmod = typmod; |
2967 | } |
2968 | else |
2969 | { |
2970 | column->typcat = TYPECAT_SCALAR; |
2971 | need_scalar = true; |
2972 | } |
2973 | |
2974 | /* caller can force us to look up scalar_io info even for non-scalars */ |
2975 | if (need_scalar) |
2976 | { |
2977 | Oid typioproc; |
2978 | |
2979 | getTypeInputInfo(typid, &typioproc, &column->scalar_io.typioparam); |
2980 | fmgr_info_cxt(typioproc, &column->scalar_io.typiofunc, mcxt); |
2981 | } |
2982 | |
2983 | ReleaseSysCache(tup); |
2984 | } |
2985 | |
2986 | /* recursively populate a record field or an array element from a json/jsonb value */ |
2987 | static Datum |
2988 | populate_record_field(ColumnIOData *col, |
2989 | Oid typid, |
2990 | int32 typmod, |
2991 | const char *colname, |
2992 | MemoryContext mcxt, |
2993 | Datum defaultval, |
2994 | JsValue *jsv, |
2995 | bool *isnull) |
2996 | { |
2997 | TypeCat typcat; |
2998 | |
2999 | check_stack_depth(); |
3000 | |
3001 | /* |
3002 | * Prepare column metadata cache for the given type. Force lookup of the |
3003 | * scalar_io data so that the json string hack below will work. |
3004 | */ |
3005 | if (col->typid != typid || col->typmod != typmod) |
3006 | prepare_column_cache(col, typid, typmod, mcxt, true); |
3007 | |
3008 | *isnull = JsValueIsNull(jsv); |
3009 | |
3010 | typcat = col->typcat; |
3011 | |
3012 | /* try to convert json string to a non-scalar type through input function */ |
3013 | if (JsValueIsString(jsv) && |
3014 | (typcat == TYPECAT_ARRAY || |
3015 | typcat == TYPECAT_COMPOSITE || |
3016 | typcat == TYPECAT_COMPOSITE_DOMAIN)) |
3017 | typcat = TYPECAT_SCALAR; |
3018 | |
3019 | /* we must perform domain checks for NULLs, otherwise exit immediately */ |
3020 | if (*isnull && |
3021 | typcat != TYPECAT_DOMAIN && |
3022 | typcat != TYPECAT_COMPOSITE_DOMAIN) |
3023 | return (Datum) 0; |
3024 | |
3025 | switch (typcat) |
3026 | { |
3027 | case TYPECAT_SCALAR: |
3028 | return populate_scalar(&col->scalar_io, typid, typmod, jsv); |
3029 | |
3030 | case TYPECAT_ARRAY: |
3031 | return populate_array(&col->io.array, colname, mcxt, jsv); |
3032 | |
3033 | case TYPECAT_COMPOSITE: |
3034 | case TYPECAT_COMPOSITE_DOMAIN: |
3035 | return populate_composite(&col->io.composite, typid, |
3036 | colname, mcxt, |
3037 | DatumGetPointer(defaultval) |
3038 | ? DatumGetHeapTupleHeader(defaultval) |
3039 | : NULL, |
3040 | jsv, *isnull); |
3041 | |
3042 | case TYPECAT_DOMAIN: |
3043 | return populate_domain(&col->io.domain, typid, colname, mcxt, |
3044 | jsv, *isnull); |
3045 | |
3046 | default: |
3047 | elog(ERROR, "unrecognized type category '%c'" , typcat); |
3048 | return (Datum) 0; |
3049 | } |
3050 | } |
3051 | |
3052 | static RecordIOData * |
3053 | allocate_record_info(MemoryContext mcxt, int ncolumns) |
3054 | { |
3055 | RecordIOData *data = (RecordIOData *) |
3056 | MemoryContextAlloc(mcxt, |
3057 | offsetof(RecordIOData, columns) + |
3058 | ncolumns * sizeof(ColumnIOData)); |
3059 | |
3060 | data->record_type = InvalidOid; |
3061 | data->record_typmod = 0; |
3062 | data->ncolumns = ncolumns; |
3063 | MemSet(data->columns, 0, sizeof(ColumnIOData) * ncolumns); |
3064 | |
3065 | return data; |
3066 | } |
3067 | |
3068 | static bool |
3069 | JsObjectGetField(JsObject *obj, char *field, JsValue *jsv) |
3070 | { |
3071 | jsv->is_json = obj->is_json; |
3072 | |
3073 | if (jsv->is_json) |
3074 | { |
3075 | JsonHashEntry *hashentry = hash_search(obj->val.json_hash, field, |
3076 | HASH_FIND, NULL); |
3077 | |
3078 | jsv->val.json.type = hashentry ? hashentry->type : JSON_TOKEN_NULL; |
3079 | jsv->val.json.str = jsv->val.json.type == JSON_TOKEN_NULL ? NULL : |
3080 | hashentry->val; |
3081 | jsv->val.json.len = jsv->val.json.str ? -1 : 0; /* null-terminated */ |
3082 | |
3083 | return hashentry != NULL; |
3084 | } |
3085 | else |
3086 | { |
3087 | jsv->val.jsonb = !obj->val.jsonb_cont ? NULL : |
3088 | findJsonbValueFromContainerLen(obj->val.jsonb_cont, JB_FOBJECT, |
3089 | field, strlen(field)); |
3090 | |
3091 | return jsv->val.jsonb != NULL; |
3092 | } |
3093 | } |
3094 | |
3095 | /* populate a record tuple from json/jsonb value */ |
3096 | static HeapTupleHeader |
3097 | populate_record(TupleDesc tupdesc, |
3098 | RecordIOData **record_p, |
3099 | HeapTupleHeader defaultval, |
3100 | MemoryContext mcxt, |
3101 | JsObject *obj) |
3102 | { |
3103 | RecordIOData *record = *record_p; |
3104 | Datum *values; |
3105 | bool *nulls; |
3106 | HeapTuple res; |
3107 | int ncolumns = tupdesc->natts; |
3108 | int i; |
3109 | |
3110 | /* |
3111 | * if the input json is empty, we can only skip the rest if we were passed |
3112 | * in a non-null record, since otherwise there may be issues with domain |
3113 | * nulls. |
3114 | */ |
3115 | if (defaultval && JsObjectIsEmpty(obj)) |
3116 | return defaultval; |
3117 | |
3118 | /* (re)allocate metadata cache */ |
3119 | if (record == NULL || |
3120 | record->ncolumns != ncolumns) |
3121 | *record_p = record = allocate_record_info(mcxt, ncolumns); |
3122 | |
3123 | /* invalidate metadata cache if the record type has changed */ |
3124 | if (record->record_type != tupdesc->tdtypeid || |
3125 | record->record_typmod != tupdesc->tdtypmod) |
3126 | { |
3127 | MemSet(record, 0, offsetof(RecordIOData, columns) + |
3128 | ncolumns * sizeof(ColumnIOData)); |
3129 | record->record_type = tupdesc->tdtypeid; |
3130 | record->record_typmod = tupdesc->tdtypmod; |
3131 | record->ncolumns = ncolumns; |
3132 | } |
3133 | |
3134 | values = (Datum *) palloc(ncolumns * sizeof(Datum)); |
3135 | nulls = (bool *) palloc(ncolumns * sizeof(bool)); |
3136 | |
3137 | if (defaultval) |
3138 | { |
3139 | HeapTupleData tuple; |
3140 | |
3141 | /* Build a temporary HeapTuple control structure */ |
3142 | tuple.t_len = HeapTupleHeaderGetDatumLength(defaultval); |
3143 | ItemPointerSetInvalid(&(tuple.t_self)); |
3144 | tuple.t_tableOid = InvalidOid; |
3145 | tuple.t_data = defaultval; |
3146 | |
3147 | /* Break down the tuple into fields */ |
3148 | heap_deform_tuple(&tuple, tupdesc, values, nulls); |
3149 | } |
3150 | else |
3151 | { |
3152 | for (i = 0; i < ncolumns; ++i) |
3153 | { |
3154 | values[i] = (Datum) 0; |
3155 | nulls[i] = true; |
3156 | } |
3157 | } |
3158 | |
3159 | for (i = 0; i < ncolumns; ++i) |
3160 | { |
3161 | Form_pg_attribute att = TupleDescAttr(tupdesc, i); |
3162 | char *colname = NameStr(att->attname); |
3163 | JsValue field = {0}; |
3164 | bool found; |
3165 | |
3166 | /* Ignore dropped columns in datatype */ |
3167 | if (att->attisdropped) |
3168 | { |
3169 | nulls[i] = true; |
3170 | continue; |
3171 | } |
3172 | |
3173 | found = JsObjectGetField(obj, colname, &field); |
3174 | |
3175 | /* |
3176 | * we can't just skip here if the key wasn't found since we might have |
3177 | * a domain to deal with. If we were passed in a non-null record |
3178 | * datum, we assume that the existing values are valid (if they're |
3179 | * not, then it's not our fault), but if we were passed in a null, |
3180 | * then every field which we don't populate needs to be run through |
3181 | * the input function just in case it's a domain type. |
3182 | */ |
3183 | if (defaultval && !found) |
3184 | continue; |
3185 | |
3186 | values[i] = populate_record_field(&record->columns[i], |
3187 | att->atttypid, |
3188 | att->atttypmod, |
3189 | colname, |
3190 | mcxt, |
3191 | nulls[i] ? (Datum) 0 : values[i], |
3192 | &field, |
3193 | &nulls[i]); |
3194 | } |
3195 | |
3196 | res = heap_form_tuple(tupdesc, values, nulls); |
3197 | |
3198 | pfree(values); |
3199 | pfree(nulls); |
3200 | |
3201 | return res->t_data; |
3202 | } |
3203 | |
3204 | /* |
3205 | * Setup for json{b}_populate_record{set}: result type will be same as first |
3206 | * argument's type --- unless first argument is "null::record", which we can't |
3207 | * extract type info from; we handle that later. |
3208 | */ |
3209 | static void |
3210 | get_record_type_from_argument(FunctionCallInfo fcinfo, |
3211 | const char *funcname, |
3212 | PopulateRecordCache *cache) |
3213 | { |
3214 | cache->argtype = get_fn_expr_argtype(fcinfo->flinfo, 0); |
3215 | prepare_column_cache(&cache->c, |
3216 | cache->argtype, -1, |
3217 | cache->fn_mcxt, false); |
3218 | if (cache->c.typcat != TYPECAT_COMPOSITE && |
3219 | cache->c.typcat != TYPECAT_COMPOSITE_DOMAIN) |
3220 | ereport(ERROR, |
3221 | (errcode(ERRCODE_DATATYPE_MISMATCH), |
3222 | /* translator: %s is a function name, eg json_to_record */ |
3223 | errmsg("first argument of %s must be a row type" , |
3224 | funcname))); |
3225 | } |
3226 | |
3227 | /* |
3228 | * Setup for json{b}_to_record{set}: result type is specified by calling |
3229 | * query. We'll also use this code for json{b}_populate_record{set}, |
3230 | * if we discover that the first argument is a null of type RECORD. |
3231 | * |
3232 | * Here it is syntactically impossible to specify the target type |
3233 | * as domain-over-composite. |
3234 | */ |
3235 | static void |
3236 | get_record_type_from_query(FunctionCallInfo fcinfo, |
3237 | const char *funcname, |
3238 | PopulateRecordCache *cache) |
3239 | { |
3240 | TupleDesc tupdesc; |
3241 | MemoryContext old_cxt; |
3242 | |
3243 | if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE) |
3244 | ereport(ERROR, |
3245 | (errcode(ERRCODE_FEATURE_NOT_SUPPORTED), |
3246 | /* translator: %s is a function name, eg json_to_record */ |
3247 | errmsg("could not determine row type for result of %s" , |
3248 | funcname), |
3249 | errhint("Provide a non-null record argument, " |
3250 | "or call the function in the FROM clause " |
3251 | "using a column definition list." ))); |
3252 | |
3253 | Assert(tupdesc); |
3254 | cache->argtype = tupdesc->tdtypeid; |
3255 | |
3256 | /* If we go through this more than once, avoid memory leak */ |
3257 | if (cache->c.io.composite.tupdesc) |
3258 | FreeTupleDesc(cache->c.io.composite.tupdesc); |
3259 | |
3260 | /* Save identified tupdesc */ |
3261 | old_cxt = MemoryContextSwitchTo(cache->fn_mcxt); |
3262 | cache->c.io.composite.tupdesc = CreateTupleDescCopy(tupdesc); |
3263 | cache->c.io.composite.base_typid = tupdesc->tdtypeid; |
3264 | cache->c.io.composite.base_typmod = tupdesc->tdtypmod; |
3265 | MemoryContextSwitchTo(old_cxt); |
3266 | } |
3267 | |
/*
 * common worker for json{b}_populate_record() and json{b}_to_record()
 * is_json and have_record_arg identify the specific function
 *
 * fcinfo is the calling function's call info; funcname is passed on to the
 * type-resolution helpers for use in their error messages.  is_json selects
 * json (true) versus jsonb (false) input.  have_record_arg is true for the
 * populate_record variants, whose argument 0 is the record and argument 1
 * the JSON; otherwise the JSON is argument 0.
 *
 * If the JSON argument is NULL, the record argument is returned unchanged,
 * or NULL if there is no record.  Otherwise the result is whatever
 * populate_composite() builds.
 */
static Datum
populate_record_worker(FunctionCallInfo fcinfo, const char *funcname,
					   bool is_json, bool have_record_arg)
{
	/* the JSON argument follows the record argument, when there is one */
	int			json_arg_num = have_record_arg ? 1 : 0;
	JsValue		jsv = {0};
	HeapTupleHeader rec;
	Datum		rettuple;
	JsonbValue	jbv;
	MemoryContext fnmcxt = fcinfo->flinfo->fn_mcxt;
	PopulateRecordCache *cache = fcinfo->flinfo->fn_extra;

	/*
	 * If first time through, identify input/result record type.  Note that
	 * this stanza looks only at fcinfo context, which can't change during the
	 * query; so we may not be able to fully resolve a RECORD input type yet.
	 */
	if (!cache)
	{
		/* the cache lives in fn_mcxt and is remembered in fn_extra */
		fcinfo->flinfo->fn_extra = cache =
			MemoryContextAllocZero(fnmcxt, sizeof(*cache));
		cache->fn_mcxt = fnmcxt;

		if (have_record_arg)
			get_record_type_from_argument(fcinfo, funcname, cache);
		else
			get_record_type_from_query(fcinfo, funcname, cache);
	}

	/* Collect record arg if we have one */
	if (!have_record_arg)
		rec = NULL;				/* it's json{b}_to_record() */
	else if (!PG_ARGISNULL(0))
	{
		rec = PG_GETARG_HEAPTUPLEHEADER(0);

		/*
		 * When declared arg type is RECORD, identify actual record type from
		 * the tuple itself.
		 */
		if (cache->argtype == RECORDOID)
		{
			cache->c.io.composite.base_typid = HeapTupleHeaderGetTypeId(rec);
			cache->c.io.composite.base_typmod = HeapTupleHeaderGetTypMod(rec);
		}
	}
	else
	{
		/* record argument is present in the signature but NULL */
		rec = NULL;

		/*
		 * When declared arg type is RECORD, identify actual record type from
		 * calling query, or fail if we can't.
		 */
		if (cache->argtype == RECORDOID)
		{
			get_record_type_from_query(fcinfo, funcname, cache);
			/* This can't change argtype, which is important for next time */
			Assert(cache->argtype == RECORDOID);
		}
	}

	/* If no JSON argument, just return the record (if any) unchanged */
	if (PG_ARGISNULL(json_arg_num))
	{
		if (rec)
			PG_RETURN_POINTER(rec);
		else
			PG_RETURN_NULL();
	}

	jsv.is_json = is_json;

	if (is_json)
	{
		text	   *json = PG_GETARG_TEXT_PP(json_arg_num);

		/* point at the text payload directly, with an explicit length */
		jsv.val.json.str = VARDATA_ANY(json);
		jsv.val.json.len = VARSIZE_ANY_EXHDR(json);
		jsv.val.json.type = JSON_TOKEN_INVALID; /* not used in
												 * populate_composite() */
	}
	else
	{
		Jsonb	   *jb = PG_GETARG_JSONB_P(json_arg_num);

		/* jbv is a local, so jsv must not be used after we return */
		jsv.val.jsonb = &jbv;

		/* fill binary jsonb value pointing to jb */
		jbv.type = jbvBinary;
		jbv.val.binary.data = &jb->root;
		jbv.val.binary.len = VARSIZE(jb) - VARHDRSZ;
	}

	/* no column name at top level; the input is passed as non-null */
	rettuple = populate_composite(&cache->c.io.composite, cache->argtype,
								  NULL, fnmcxt, rec, &jsv, false);

	PG_RETURN_DATUM(rettuple);
}
3371 | |
3372 | /* |
3373 | * get_json_object_as_hash |
3374 | * |
3375 | * decompose a json object into a hash table. |
3376 | */ |
3377 | static HTAB * |
3378 | get_json_object_as_hash(char *json, int len, const char *funcname) |
3379 | { |
3380 | HASHCTL ctl; |
3381 | HTAB *tab; |
3382 | JHashState *state; |
3383 | JsonLexContext *lex = makeJsonLexContextCstringLen(json, len, true); |
3384 | JsonSemAction *sem; |
3385 | |
3386 | memset(&ctl, 0, sizeof(ctl)); |
3387 | ctl.keysize = NAMEDATALEN; |
3388 | ctl.entrysize = sizeof(JsonHashEntry); |
3389 | ctl.hcxt = CurrentMemoryContext; |
3390 | tab = hash_create("json object hashtable" , |
3391 | 100, |
3392 | &ctl, |
3393 | HASH_ELEM | HASH_CONTEXT); |
3394 | |
3395 | state = palloc0(sizeof(JHashState)); |
3396 | sem = palloc0(sizeof(JsonSemAction)); |
3397 | |
3398 | state->function_name = funcname; |
3399 | state->hash = tab; |
3400 | state->lex = lex; |
3401 | |
3402 | sem->semstate = (void *) state; |
3403 | sem->array_start = hash_array_start; |
3404 | sem->scalar = hash_scalar; |
3405 | sem->object_field_start = hash_object_field_start; |
3406 | sem->object_field_end = hash_object_field_end; |
3407 | |
3408 | pg_parse_json(lex, sem); |
3409 | |
3410 | return tab; |
3411 | } |
3412 | |
3413 | static void |
3414 | hash_object_field_start(void *state, char *fname, bool isnull) |
3415 | { |
3416 | JHashState *_state = (JHashState *) state; |
3417 | |
3418 | if (_state->lex->lex_level > 1) |
3419 | return; |
3420 | |
3421 | /* remember token type */ |
3422 | _state->saved_token_type = _state->lex->token_type; |
3423 | |
3424 | if (_state->lex->token_type == JSON_TOKEN_ARRAY_START || |
3425 | _state->lex->token_type == JSON_TOKEN_OBJECT_START) |
3426 | { |
3427 | /* remember start position of the whole text of the subobject */ |
3428 | _state->save_json_start = _state->lex->token_start; |
3429 | } |
3430 | else |
3431 | { |
3432 | /* must be a scalar */ |
3433 | _state->save_json_start = NULL; |
3434 | } |
3435 | } |
3436 | |
3437 | static void |
3438 | hash_object_field_end(void *state, char *fname, bool isnull) |
3439 | { |
3440 | JHashState *_state = (JHashState *) state; |
3441 | JsonHashEntry *hashentry; |
3442 | bool found; |
3443 | |
3444 | /* |
3445 | * Ignore nested fields. |
3446 | */ |
3447 | if (_state->lex->lex_level > 1) |
3448 | return; |
3449 | |
3450 | /* |
3451 | * Ignore field names >= NAMEDATALEN - they can't match a record field. |
3452 | * (Note: without this test, the hash code would truncate the string at |
3453 | * NAMEDATALEN-1, and could then match against a similarly-truncated |
3454 | * record field name. That would be a reasonable behavior, but this code |
3455 | * has previously insisted on exact equality, so we keep this behavior.) |
3456 | */ |
3457 | if (strlen(fname) >= NAMEDATALEN) |
3458 | return; |
3459 | |
3460 | hashentry = hash_search(_state->hash, fname, HASH_ENTER, &found); |
3461 | |
3462 | /* |
3463 | * found being true indicates a duplicate. We don't do anything about |
3464 | * that, a later field with the same name overrides the earlier field. |
3465 | */ |
3466 | |
3467 | hashentry->type = _state->saved_token_type; |
3468 | Assert(isnull == (hashentry->type == JSON_TOKEN_NULL)); |
3469 | |
3470 | if (_state->save_json_start != NULL) |
3471 | { |
3472 | int len = _state->lex->prev_token_terminator - _state->save_json_start; |
3473 | char *val = palloc((len + 1) * sizeof(char)); |
3474 | |
3475 | memcpy(val, _state->save_json_start, len); |
3476 | val[len] = '\0'; |
3477 | hashentry->val = val; |
3478 | } |
3479 | else |
3480 | { |
3481 | /* must have had a scalar instead */ |
3482 | hashentry->val = _state->saved_scalar; |
3483 | } |
3484 | } |
3485 | |
3486 | static void |
3487 | hash_array_start(void *state) |
3488 | { |
3489 | JHashState *_state = (JHashState *) state; |
3490 | |
3491 | if (_state->lex->lex_level == 0) |
3492 | ereport(ERROR, |
3493 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
3494 | errmsg("cannot call %s on an array" , _state->function_name))); |
3495 | } |
3496 | |
3497 | static void |
3498 | hash_scalar(void *state, char *token, JsonTokenType tokentype) |
3499 | { |
3500 | JHashState *_state = (JHashState *) state; |
3501 | |
3502 | if (_state->lex->lex_level == 0) |
3503 | ereport(ERROR, |
3504 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
3505 | errmsg("cannot call %s on a scalar" , _state->function_name))); |
3506 | |
3507 | if (_state->lex->lex_level == 1) |
3508 | { |
3509 | _state->saved_scalar = token; |
3510 | /* saved_token_type must already be set in hash_object_field_start() */ |
3511 | Assert(_state->saved_token_type == tokentype); |
3512 | } |
3513 | } |
3514 | |
3515 | |
3516 | /* |
3517 | * SQL function json_populate_recordset |
3518 | * |
3519 | * set fields in a set of records from the argument json, |
3520 | * which must be an array of objects. |
3521 | * |
3522 | * similar to json_populate_record, but the tuple-building code |
3523 | * is pushed down into the semantic action handlers so it's done |
3524 | * per object in the array. |
3525 | */ |
3526 | Datum |
3527 | jsonb_populate_recordset(PG_FUNCTION_ARGS) |
3528 | { |
3529 | return populate_recordset_worker(fcinfo, "jsonb_populate_recordset" , |
3530 | false, true); |
3531 | } |
3532 | |
3533 | Datum |
3534 | jsonb_to_recordset(PG_FUNCTION_ARGS) |
3535 | { |
3536 | return populate_recordset_worker(fcinfo, "jsonb_to_recordset" , |
3537 | false, false); |
3538 | } |
3539 | |
3540 | Datum |
3541 | json_populate_recordset(PG_FUNCTION_ARGS) |
3542 | { |
3543 | return populate_recordset_worker(fcinfo, "json_populate_recordset" , |
3544 | true, true); |
3545 | } |
3546 | |
3547 | Datum |
3548 | json_to_recordset(PG_FUNCTION_ARGS) |
3549 | { |
3550 | return populate_recordset_worker(fcinfo, "json_to_recordset" , |
3551 | true, false); |
3552 | } |
3553 | |
3554 | static void |
3555 | populate_recordset_record(PopulateRecordsetState *state, JsObject *obj) |
3556 | { |
3557 | PopulateRecordCache *cache = state->cache; |
3558 | HeapTupleHeader tuphead; |
3559 | HeapTupleData tuple; |
3560 | |
3561 | /* acquire/update cached tuple descriptor */ |
3562 | update_cached_tupdesc(&cache->c.io.composite, cache->fn_mcxt); |
3563 | |
3564 | /* replace record fields from json */ |
3565 | tuphead = populate_record(cache->c.io.composite.tupdesc, |
3566 | &cache->c.io.composite.record_io, |
3567 | state->rec, |
3568 | cache->fn_mcxt, |
3569 | obj); |
3570 | |
3571 | /* if it's domain over composite, check domain constraints */ |
3572 | if (cache->c.typcat == TYPECAT_COMPOSITE_DOMAIN) |
3573 | domain_check(HeapTupleHeaderGetDatum(tuphead), false, |
3574 | cache->argtype, |
3575 | &cache->c.io.composite.domain_info, |
3576 | cache->fn_mcxt); |
3577 | |
3578 | /* ok, save into tuplestore */ |
3579 | tuple.t_len = HeapTupleHeaderGetDatumLength(tuphead); |
3580 | ItemPointerSetInvalid(&(tuple.t_self)); |
3581 | tuple.t_tableOid = InvalidOid; |
3582 | tuple.t_data = tuphead; |
3583 | |
3584 | tuplestore_puttuple(state->tuple_store, &tuple); |
3585 | } |
3586 | |
/*
 * common worker for json{b}_populate_recordset() and json{b}_to_recordset()
 * is_json and have_record_arg identify the specific function
 *
 * fcinfo is the calling function's call info; funcname is used in error
 * messages.  is_json selects json (true) versus jsonb (false) input.
 * have_record_arg is true for the populate_recordset variants, whose
 * argument 0 is the record and argument 1 the JSON; otherwise the JSON is
 * argument 0.
 *
 * The result set is returned in materialize mode: rows are collected in a
 * tuplestore handed back through the ReturnSetInfo, and the function's own
 * return value is always NULL.
 */
static Datum
populate_recordset_worker(FunctionCallInfo fcinfo, const char *funcname,
						  bool is_json, bool have_record_arg)
{
	/* the JSON argument follows the record argument, when there is one */
	int			json_arg_num = have_record_arg ? 1 : 0;
	ReturnSetInfo *rsi;
	MemoryContext old_cxt;
	HeapTupleHeader rec;
	PopulateRecordCache *cache = fcinfo->flinfo->fn_extra;
	PopulateRecordsetState *state;

	rsi = (ReturnSetInfo *) fcinfo->resultinfo;

	/* the caller must be able to accept a materialized set */
	if (!rsi || !IsA(rsi, ReturnSetInfo) ||
		(rsi->allowedModes & SFRM_Materialize) == 0)
		ereport(ERROR,
				(errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
				 errmsg("set-valued function called in context that "
						"cannot accept a set")));

	rsi->returnMode = SFRM_Materialize;

	/*
	 * If first time through, identify input/result record type.  Note that
	 * this stanza looks only at fcinfo context, which can't change during the
	 * query; so we may not be able to fully resolve a RECORD input type yet.
	 */
	if (!cache)
	{
		/* the cache lives in fn_mcxt and is remembered in fn_extra */
		fcinfo->flinfo->fn_extra = cache =
			MemoryContextAllocZero(fcinfo->flinfo->fn_mcxt, sizeof(*cache));
		cache->fn_mcxt = fcinfo->flinfo->fn_mcxt;

		if (have_record_arg)
			get_record_type_from_argument(fcinfo, funcname, cache);
		else
			get_record_type_from_query(fcinfo, funcname, cache);
	}

	/* Collect record arg if we have one */
	if (!have_record_arg)
		rec = NULL;				/* it's json{b}_to_recordset() */
	else if (!PG_ARGISNULL(0))
	{
		rec = PG_GETARG_HEAPTUPLEHEADER(0);

		/*
		 * When declared arg type is RECORD, identify actual record type from
		 * the tuple itself.
		 */
		if (cache->argtype == RECORDOID)
		{
			cache->c.io.composite.base_typid = HeapTupleHeaderGetTypeId(rec);
			cache->c.io.composite.base_typmod = HeapTupleHeaderGetTypMod(rec);
		}
	}
	else
	{
		/* record argument is present in the signature but NULL */
		rec = NULL;

		/*
		 * When declared arg type is RECORD, identify actual record type from
		 * calling query, or fail if we can't.
		 */
		if (cache->argtype == RECORDOID)
		{
			get_record_type_from_query(fcinfo, funcname, cache);
			/* This can't change argtype, which is important for next time */
			Assert(cache->argtype == RECORDOID);
		}
	}

	/* if the json is null send back an empty set */
	if (PG_ARGISNULL(json_arg_num))
		PG_RETURN_NULL();

	/*
	 * Forcibly update the cached tupdesc, to ensure we have the right tupdesc
	 * to return even if the JSON contains no rows.
	 */
	update_cached_tupdesc(&cache->c.io.composite, cache->fn_mcxt);

	state = palloc0(sizeof(PopulateRecordsetState));

	/* make tuplestore in a sufficiently long-lived memory context */
	old_cxt = MemoryContextSwitchTo(rsi->econtext->ecxt_per_query_memory);
	state->tuple_store = tuplestore_begin_heap(rsi->allowedModes &
											   SFRM_Materialize_Random,
											   false, work_mem);
	MemoryContextSwitchTo(old_cxt);

	state->function_name = funcname;
	state->cache = cache;
	state->rec = rec;

	if (is_json)
	{
		/* json: parse the text; the callbacks emit one row per object */
		text	   *json = PG_GETARG_TEXT_PP(json_arg_num);
		JsonLexContext *lex;
		JsonSemAction *sem;

		sem = palloc0(sizeof(JsonSemAction));

		lex = makeJsonLexContext(json, true);

		sem->semstate = (void *) state;
		sem->array_start = populate_recordset_array_start;
		sem->array_element_start = populate_recordset_array_element_start;
		sem->scalar = populate_recordset_scalar;
		sem->object_field_start = populate_recordset_object_field_start;
		sem->object_field_end = populate_recordset_object_field_end;
		sem->object_start = populate_recordset_object_start;
		sem->object_end = populate_recordset_object_end;

		/* the callbacks read the lexer position through state->lex */
		state->lex = lex;

		pg_parse_json(lex, sem);
	}
	else
	{
		/* jsonb: walk the top-level array's elements directly */
		Jsonb	   *jb = PG_GETARG_JSONB_P(json_arg_num);
		JsonbIterator *it;
		JsonbValue	v;
		bool		skipNested = false;
		JsonbIteratorToken r;

		if (JB_ROOT_IS_SCALAR(jb) || !JB_ROOT_IS_ARRAY(jb))
			ereport(ERROR,
					(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
					 errmsg("cannot call %s on a non-array",
							funcname)));

		it = JsonbIteratorInit(&jb->root);

		while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE)
		{
			/* skipNested is false only for the first call, true afterwards */
			skipNested = true;

			if (r == WJB_ELEM)
			{
				JsObject	obj;

				/* each array element must itself be an object */
				if (v.type != jbvBinary ||
					!JsonContainerIsObject(v.val.binary.data))
					ereport(ERROR,
							(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
							 errmsg("argument of %s must be an array of objects",
									funcname)));

				obj.is_json = false;
				obj.val.jsonb_cont = v.val.binary.data;

				populate_recordset_record(state, &obj);
			}
		}
	}

	/*
	 * Note: we must copy the cached tupdesc because the executor will free
	 * the passed-back setDesc, but we want to hang onto the cache in case
	 * we're called again in the same query.
	 */
	rsi->setResult = state->tuple_store;
	rsi->setDesc = CreateTupleDescCopy(cache->c.io.composite.tupdesc);

	/* the rows travel in rsi->setResult, not in the return value */
	PG_RETURN_NULL();
}
3758 | |
3759 | static void |
3760 | populate_recordset_object_start(void *state) |
3761 | { |
3762 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3763 | int lex_level = _state->lex->lex_level; |
3764 | HASHCTL ctl; |
3765 | |
3766 | /* Reject object at top level: we must have an array at level 0 */ |
3767 | if (lex_level == 0) |
3768 | ereport(ERROR, |
3769 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
3770 | errmsg("cannot call %s on an object" , |
3771 | _state->function_name))); |
3772 | |
3773 | /* Nested objects require no special processing */ |
3774 | if (lex_level > 1) |
3775 | return; |
3776 | |
3777 | /* Object at level 1: set up a new hash table for this object */ |
3778 | memset(&ctl, 0, sizeof(ctl)); |
3779 | ctl.keysize = NAMEDATALEN; |
3780 | ctl.entrysize = sizeof(JsonHashEntry); |
3781 | ctl.hcxt = CurrentMemoryContext; |
3782 | _state->json_hash = hash_create("json object hashtable" , |
3783 | 100, |
3784 | &ctl, |
3785 | HASH_ELEM | HASH_CONTEXT); |
3786 | } |
3787 | |
3788 | static void |
3789 | populate_recordset_object_end(void *state) |
3790 | { |
3791 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3792 | JsObject obj; |
3793 | |
3794 | /* Nested objects require no special processing */ |
3795 | if (_state->lex->lex_level > 1) |
3796 | return; |
3797 | |
3798 | obj.is_json = true; |
3799 | obj.val.json_hash = _state->json_hash; |
3800 | |
3801 | /* Otherwise, construct and return a tuple based on this level-1 object */ |
3802 | populate_recordset_record(_state, &obj); |
3803 | |
3804 | /* Done with hash for this object */ |
3805 | hash_destroy(_state->json_hash); |
3806 | _state->json_hash = NULL; |
3807 | } |
3808 | |
3809 | static void |
3810 | populate_recordset_array_element_start(void *state, bool isnull) |
3811 | { |
3812 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3813 | |
3814 | if (_state->lex->lex_level == 1 && |
3815 | _state->lex->token_type != JSON_TOKEN_OBJECT_START) |
3816 | ereport(ERROR, |
3817 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
3818 | errmsg("argument of %s must be an array of objects" , |
3819 | _state->function_name))); |
3820 | } |
3821 | |
/*
 * populate_recordset_array_start
 *
 * Semantic callback run at the start of any array.  It performs no work and
 * does not look at "state".
 */
static void
populate_recordset_array_start(void *state)
{
	/* nothing to do */
}
3827 | |
3828 | static void |
3829 | populate_recordset_scalar(void *state, char *token, JsonTokenType tokentype) |
3830 | { |
3831 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3832 | |
3833 | if (_state->lex->lex_level == 0) |
3834 | ereport(ERROR, |
3835 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
3836 | errmsg("cannot call %s on a scalar" , |
3837 | _state->function_name))); |
3838 | |
3839 | if (_state->lex->lex_level == 2) |
3840 | _state->saved_scalar = token; |
3841 | } |
3842 | |
3843 | static void |
3844 | populate_recordset_object_field_start(void *state, char *fname, bool isnull) |
3845 | { |
3846 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3847 | |
3848 | if (_state->lex->lex_level > 2) |
3849 | return; |
3850 | |
3851 | _state->saved_token_type = _state->lex->token_type; |
3852 | |
3853 | if (_state->lex->token_type == JSON_TOKEN_ARRAY_START || |
3854 | _state->lex->token_type == JSON_TOKEN_OBJECT_START) |
3855 | { |
3856 | _state->save_json_start = _state->lex->token_start; |
3857 | } |
3858 | else |
3859 | { |
3860 | _state->save_json_start = NULL; |
3861 | } |
3862 | } |
3863 | |
3864 | static void |
3865 | populate_recordset_object_field_end(void *state, char *fname, bool isnull) |
3866 | { |
3867 | PopulateRecordsetState *_state = (PopulateRecordsetState *) state; |
3868 | JsonHashEntry *hashentry; |
3869 | bool found; |
3870 | |
3871 | /* |
3872 | * Ignore nested fields. |
3873 | */ |
3874 | if (_state->lex->lex_level > 2) |
3875 | return; |
3876 | |
3877 | /* |
3878 | * Ignore field names >= NAMEDATALEN - they can't match a record field. |
3879 | * (Note: without this test, the hash code would truncate the string at |
3880 | * NAMEDATALEN-1, and could then match against a similarly-truncated |
3881 | * record field name. That would be a reasonable behavior, but this code |
3882 | * has previously insisted on exact equality, so we keep this behavior.) |
3883 | */ |
3884 | if (strlen(fname) >= NAMEDATALEN) |
3885 | return; |
3886 | |
3887 | hashentry = hash_search(_state->json_hash, fname, HASH_ENTER, &found); |
3888 | |
3889 | /* |
3890 | * found being true indicates a duplicate. We don't do anything about |
3891 | * that, a later field with the same name overrides the earlier field. |
3892 | */ |
3893 | |
3894 | hashentry->type = _state->saved_token_type; |
3895 | Assert(isnull == (hashentry->type == JSON_TOKEN_NULL)); |
3896 | |
3897 | if (_state->save_json_start != NULL) |
3898 | { |
3899 | int len = _state->lex->prev_token_terminator - _state->save_json_start; |
3900 | char *val = palloc((len + 1) * sizeof(char)); |
3901 | |
3902 | memcpy(val, _state->save_json_start, len); |
3903 | val[len] = '\0'; |
3904 | hashentry->val = val; |
3905 | } |
3906 | else |
3907 | { |
3908 | /* must have had a scalar instead */ |
3909 | hashentry->val = _state->saved_scalar; |
3910 | } |
3911 | } |
3912 | |
3913 | /* |
3914 | * findJsonbValueFromContainer() wrapper that sets up JsonbValue key string. |
3915 | */ |
3916 | static JsonbValue * |
3917 | findJsonbValueFromContainerLen(JsonbContainer *container, uint32 flags, |
3918 | char *key, uint32 keylen) |
3919 | { |
3920 | JsonbValue k; |
3921 | |
3922 | k.type = jbvString; |
3923 | k.val.string.val = key; |
3924 | k.val.string.len = keylen; |
3925 | |
3926 | return findJsonbValueFromContainer(container, flags, &k); |
3927 | } |
3928 | |
3929 | /* |
3930 | * Semantic actions for json_strip_nulls. |
3931 | * |
3932 | * Simply repeat the input on the output unless we encounter |
3933 | * a null object field. State for this is set when the field |
3934 | * is started and reset when the scalar action (which must be next) |
3935 | * is called. |
3936 | */ |
3937 | |
3938 | static void |
3939 | sn_object_start(void *state) |
3940 | { |
3941 | StripnullState *_state = (StripnullState *) state; |
3942 | |
3943 | appendStringInfoCharMacro(_state->strval, '{'); |
3944 | } |
3945 | |
3946 | static void |
3947 | sn_object_end(void *state) |
3948 | { |
3949 | StripnullState *_state = (StripnullState *) state; |
3950 | |
3951 | appendStringInfoCharMacro(_state->strval, '}'); |
3952 | } |
3953 | |
3954 | static void |
3955 | sn_array_start(void *state) |
3956 | { |
3957 | StripnullState *_state = (StripnullState *) state; |
3958 | |
3959 | appendStringInfoCharMacro(_state->strval, '['); |
3960 | } |
3961 | |
3962 | static void |
3963 | sn_array_end(void *state) |
3964 | { |
3965 | StripnullState *_state = (StripnullState *) state; |
3966 | |
3967 | appendStringInfoCharMacro(_state->strval, ']'); |
3968 | } |
3969 | |
3970 | static void |
3971 | sn_object_field_start(void *state, char *fname, bool isnull) |
3972 | { |
3973 | StripnullState *_state = (StripnullState *) state; |
3974 | |
3975 | if (isnull) |
3976 | { |
3977 | /* |
3978 | * The next thing must be a scalar or isnull couldn't be true, so |
3979 | * there is no danger of this state being carried down into a nested |
3980 | * object or array. The flag will be reset in the scalar action. |
3981 | */ |
3982 | _state->skip_next_null = true; |
3983 | return; |
3984 | } |
3985 | |
3986 | if (_state->strval->data[_state->strval->len - 1] != '{') |
3987 | appendStringInfoCharMacro(_state->strval, ','); |
3988 | |
3989 | /* |
3990 | * Unfortunately we don't have the quoted and escaped string any more, so |
3991 | * we have to re-escape it. |
3992 | */ |
3993 | escape_json(_state->strval, fname); |
3994 | |
3995 | appendStringInfoCharMacro(_state->strval, ':'); |
3996 | } |
3997 | |
3998 | static void |
3999 | sn_array_element_start(void *state, bool isnull) |
4000 | { |
4001 | StripnullState *_state = (StripnullState *) state; |
4002 | |
4003 | if (_state->strval->data[_state->strval->len - 1] != '[') |
4004 | appendStringInfoCharMacro(_state->strval, ','); |
4005 | } |
4006 | |
4007 | static void |
4008 | sn_scalar(void *state, char *token, JsonTokenType tokentype) |
4009 | { |
4010 | StripnullState *_state = (StripnullState *) state; |
4011 | |
4012 | if (_state->skip_next_null) |
4013 | { |
4014 | Assert(tokentype == JSON_TOKEN_NULL); |
4015 | _state->skip_next_null = false; |
4016 | return; |
4017 | } |
4018 | |
4019 | if (tokentype == JSON_TOKEN_STRING) |
4020 | escape_json(_state->strval, token); |
4021 | else |
4022 | appendStringInfoString(_state->strval, token); |
4023 | } |
4024 | |
4025 | /* |
4026 | * SQL function json_strip_nulls(json) -> json |
4027 | */ |
4028 | Datum |
4029 | json_strip_nulls(PG_FUNCTION_ARGS) |
4030 | { |
4031 | text *json = PG_GETARG_TEXT_PP(0); |
4032 | StripnullState *state; |
4033 | JsonLexContext *lex; |
4034 | JsonSemAction *sem; |
4035 | |
4036 | lex = makeJsonLexContext(json, true); |
4037 | state = palloc0(sizeof(StripnullState)); |
4038 | sem = palloc0(sizeof(JsonSemAction)); |
4039 | |
4040 | state->strval = makeStringInfo(); |
4041 | state->skip_next_null = false; |
4042 | state->lex = lex; |
4043 | |
4044 | sem->semstate = (void *) state; |
4045 | sem->object_start = sn_object_start; |
4046 | sem->object_end = sn_object_end; |
4047 | sem->array_start = sn_array_start; |
4048 | sem->array_end = sn_array_end; |
4049 | sem->scalar = sn_scalar; |
4050 | sem->array_element_start = sn_array_element_start; |
4051 | sem->object_field_start = sn_object_field_start; |
4052 | |
4053 | pg_parse_json(lex, sem); |
4054 | |
4055 | PG_RETURN_TEXT_P(cstring_to_text_with_len(state->strval->data, |
4056 | state->strval->len)); |
4057 | |
4058 | } |
4059 | |
4060 | /* |
4061 | * SQL function jsonb_strip_nulls(jsonb) -> jsonb |
4062 | */ |
4063 | Datum |
4064 | jsonb_strip_nulls(PG_FUNCTION_ARGS) |
4065 | { |
4066 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
4067 | JsonbIterator *it; |
4068 | JsonbParseState *parseState = NULL; |
4069 | JsonbValue *res = NULL; |
4070 | JsonbValue v, |
4071 | k; |
4072 | JsonbIteratorToken type; |
4073 | bool last_was_key = false; |
4074 | |
4075 | if (JB_ROOT_IS_SCALAR(jb)) |
4076 | PG_RETURN_POINTER(jb); |
4077 | |
4078 | it = JsonbIteratorInit(&jb->root); |
4079 | |
4080 | while ((type = JsonbIteratorNext(&it, &v, false)) != WJB_DONE) |
4081 | { |
4082 | Assert(!(type == WJB_KEY && last_was_key)); |
4083 | |
4084 | if (type == WJB_KEY) |
4085 | { |
4086 | /* stash the key until we know if it has a null value */ |
4087 | k = v; |
4088 | last_was_key = true; |
4089 | continue; |
4090 | } |
4091 | |
4092 | if (last_was_key) |
4093 | { |
4094 | /* if the last element was a key this one can't be */ |
4095 | last_was_key = false; |
4096 | |
4097 | /* skip this field if value is null */ |
4098 | if (type == WJB_VALUE && v.type == jbvNull) |
4099 | continue; |
4100 | |
4101 | /* otherwise, do a delayed push of the key */ |
4102 | (void) pushJsonbValue(&parseState, WJB_KEY, &k); |
4103 | } |
4104 | |
4105 | if (type == WJB_VALUE || type == WJB_ELEM) |
4106 | res = pushJsonbValue(&parseState, type, &v); |
4107 | else |
4108 | res = pushJsonbValue(&parseState, type, NULL); |
4109 | } |
4110 | |
4111 | Assert(res != NULL); |
4112 | |
4113 | PG_RETURN_POINTER(JsonbValueToJsonb(res)); |
4114 | } |
4115 | |
4116 | /* |
4117 | * Add values from the jsonb to the parse state. |
4118 | * |
4119 | * If the parse state container is an object, the jsonb is pushed as |
4120 | * a value, not a key. |
4121 | * |
4122 | * This needs to be done using an iterator because pushJsonbValue doesn't |
4123 | * like getting jbvBinary values, so we can't just push jb as a whole. |
4124 | */ |
4125 | static void |
4126 | addJsonbToParseState(JsonbParseState **jbps, Jsonb *jb) |
4127 | { |
4128 | JsonbIterator *it; |
4129 | JsonbValue *o = &(*jbps)->contVal; |
4130 | JsonbValue v; |
4131 | JsonbIteratorToken type; |
4132 | |
4133 | it = JsonbIteratorInit(&jb->root); |
4134 | |
4135 | Assert(o->type == jbvArray || o->type == jbvObject); |
4136 | |
4137 | if (JB_ROOT_IS_SCALAR(jb)) |
4138 | { |
4139 | (void) JsonbIteratorNext(&it, &v, false); /* skip array header */ |
4140 | Assert(v.type == jbvArray); |
4141 | (void) JsonbIteratorNext(&it, &v, false); /* fetch scalar value */ |
4142 | |
4143 | switch (o->type) |
4144 | { |
4145 | case jbvArray: |
4146 | (void) pushJsonbValue(jbps, WJB_ELEM, &v); |
4147 | break; |
4148 | case jbvObject: |
4149 | (void) pushJsonbValue(jbps, WJB_VALUE, &v); |
4150 | break; |
4151 | default: |
4152 | elog(ERROR, "unexpected parent of nested structure" ); |
4153 | } |
4154 | } |
4155 | else |
4156 | { |
4157 | while ((type = JsonbIteratorNext(&it, &v, false)) != WJB_DONE) |
4158 | { |
4159 | if (type == WJB_KEY || type == WJB_VALUE || type == WJB_ELEM) |
4160 | (void) pushJsonbValue(jbps, type, &v); |
4161 | else |
4162 | (void) pushJsonbValue(jbps, type, NULL); |
4163 | } |
4164 | } |
4165 | |
4166 | } |
4167 | |
4168 | /* |
4169 | * SQL function jsonb_pretty (jsonb) |
4170 | * |
4171 | * Pretty-printed text for the jsonb |
4172 | */ |
4173 | Datum |
4174 | jsonb_pretty(PG_FUNCTION_ARGS) |
4175 | { |
4176 | Jsonb *jb = PG_GETARG_JSONB_P(0); |
4177 | StringInfo str = makeStringInfo(); |
4178 | |
4179 | JsonbToCStringIndent(str, &jb->root, VARSIZE(jb)); |
4180 | |
4181 | PG_RETURN_TEXT_P(cstring_to_text_with_len(str->data, str->len)); |
4182 | } |
4183 | |
4184 | /* |
4185 | * SQL function jsonb_concat (jsonb, jsonb) |
4186 | * |
4187 | * function for || operator |
4188 | */ |
4189 | Datum |
4190 | jsonb_concat(PG_FUNCTION_ARGS) |
4191 | { |
4192 | Jsonb *jb1 = PG_GETARG_JSONB_P(0); |
4193 | Jsonb *jb2 = PG_GETARG_JSONB_P(1); |
4194 | JsonbParseState *state = NULL; |
4195 | JsonbValue *res; |
4196 | JsonbIterator *it1, |
4197 | *it2; |
4198 | |
4199 | /* |
4200 | * If one of the jsonb is empty, just return the other if it's not scalar |
4201 | * and both are of the same kind. If it's a scalar or they are of |
4202 | * different kinds we need to perform the concatenation even if one is |
4203 | * empty. |
4204 | */ |
4205 | if (JB_ROOT_IS_OBJECT(jb1) == JB_ROOT_IS_OBJECT(jb2)) |
4206 | { |
4207 | if (JB_ROOT_COUNT(jb1) == 0 && !JB_ROOT_IS_SCALAR(jb2)) |
4208 | PG_RETURN_JSONB_P(jb2); |
4209 | else if (JB_ROOT_COUNT(jb2) == 0 && !JB_ROOT_IS_SCALAR(jb1)) |
4210 | PG_RETURN_JSONB_P(jb1); |
4211 | } |
4212 | |
4213 | it1 = JsonbIteratorInit(&jb1->root); |
4214 | it2 = JsonbIteratorInit(&jb2->root); |
4215 | |
4216 | res = IteratorConcat(&it1, &it2, &state); |
4217 | |
4218 | Assert(res != NULL); |
4219 | |
4220 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4221 | } |
4222 | |
4223 | |
4224 | /* |
4225 | * SQL function jsonb_delete (jsonb, text) |
4226 | * |
4227 | * return a copy of the jsonb with the indicated item |
4228 | * removed. |
4229 | */ |
4230 | Datum |
4231 | jsonb_delete(PG_FUNCTION_ARGS) |
4232 | { |
4233 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4234 | text *key = PG_GETARG_TEXT_PP(1); |
4235 | char *keyptr = VARDATA_ANY(key); |
4236 | int keylen = VARSIZE_ANY_EXHDR(key); |
4237 | JsonbParseState *state = NULL; |
4238 | JsonbIterator *it; |
4239 | JsonbValue v, |
4240 | *res = NULL; |
4241 | bool skipNested = false; |
4242 | JsonbIteratorToken r; |
4243 | |
4244 | if (JB_ROOT_IS_SCALAR(in)) |
4245 | ereport(ERROR, |
4246 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4247 | errmsg("cannot delete from scalar" ))); |
4248 | |
4249 | if (JB_ROOT_COUNT(in) == 0) |
4250 | PG_RETURN_JSONB_P(in); |
4251 | |
4252 | it = JsonbIteratorInit(&in->root); |
4253 | |
4254 | while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE) |
4255 | { |
4256 | skipNested = true; |
4257 | |
4258 | if ((r == WJB_ELEM || r == WJB_KEY) && |
4259 | (v.type == jbvString && keylen == v.val.string.len && |
4260 | memcmp(keyptr, v.val.string.val, keylen) == 0)) |
4261 | { |
4262 | /* skip corresponding value as well */ |
4263 | if (r == WJB_KEY) |
4264 | (void) JsonbIteratorNext(&it, &v, true); |
4265 | |
4266 | continue; |
4267 | } |
4268 | |
4269 | res = pushJsonbValue(&state, r, r < WJB_BEGIN_ARRAY ? &v : NULL); |
4270 | } |
4271 | |
4272 | Assert(res != NULL); |
4273 | |
4274 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4275 | } |
4276 | |
4277 | /* |
4278 | * SQL function jsonb_delete (jsonb, variadic text[]) |
4279 | * |
4280 | * return a copy of the jsonb with the indicated items |
4281 | * removed. |
4282 | */ |
4283 | Datum |
4284 | jsonb_delete_array(PG_FUNCTION_ARGS) |
4285 | { |
4286 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4287 | ArrayType *keys = PG_GETARG_ARRAYTYPE_P(1); |
4288 | Datum *keys_elems; |
4289 | bool *keys_nulls; |
4290 | int keys_len; |
4291 | JsonbParseState *state = NULL; |
4292 | JsonbIterator *it; |
4293 | JsonbValue v, |
4294 | *res = NULL; |
4295 | bool skipNested = false; |
4296 | JsonbIteratorToken r; |
4297 | |
4298 | if (ARR_NDIM(keys) > 1) |
4299 | ereport(ERROR, |
4300 | (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR), |
4301 | errmsg("wrong number of array subscripts" ))); |
4302 | |
4303 | if (JB_ROOT_IS_SCALAR(in)) |
4304 | ereport(ERROR, |
4305 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4306 | errmsg("cannot delete from scalar" ))); |
4307 | |
4308 | if (JB_ROOT_COUNT(in) == 0) |
4309 | PG_RETURN_JSONB_P(in); |
4310 | |
4311 | deconstruct_array(keys, TEXTOID, -1, false, 'i', |
4312 | &keys_elems, &keys_nulls, &keys_len); |
4313 | |
4314 | if (keys_len == 0) |
4315 | PG_RETURN_JSONB_P(in); |
4316 | |
4317 | it = JsonbIteratorInit(&in->root); |
4318 | |
4319 | while ((r = JsonbIteratorNext(&it, &v, skipNested)) != WJB_DONE) |
4320 | { |
4321 | skipNested = true; |
4322 | |
4323 | if ((r == WJB_ELEM || r == WJB_KEY) && v.type == jbvString) |
4324 | { |
4325 | int i; |
4326 | bool found = false; |
4327 | |
4328 | for (i = 0; i < keys_len; i++) |
4329 | { |
4330 | char *keyptr; |
4331 | int keylen; |
4332 | |
4333 | if (keys_nulls[i]) |
4334 | continue; |
4335 | |
4336 | keyptr = VARDATA_ANY(keys_elems[i]); |
4337 | keylen = VARSIZE_ANY_EXHDR(keys_elems[i]); |
4338 | if (keylen == v.val.string.len && |
4339 | memcmp(keyptr, v.val.string.val, keylen) == 0) |
4340 | { |
4341 | found = true; |
4342 | break; |
4343 | } |
4344 | } |
4345 | if (found) |
4346 | { |
4347 | /* skip corresponding value as well */ |
4348 | if (r == WJB_KEY) |
4349 | (void) JsonbIteratorNext(&it, &v, true); |
4350 | |
4351 | continue; |
4352 | } |
4353 | } |
4354 | |
4355 | res = pushJsonbValue(&state, r, r < WJB_BEGIN_ARRAY ? &v : NULL); |
4356 | } |
4357 | |
4358 | Assert(res != NULL); |
4359 | |
4360 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4361 | } |
4362 | |
4363 | /* |
4364 | * SQL function jsonb_delete (jsonb, int) |
4365 | * |
4366 | * return a copy of the jsonb with the indicated item |
4367 | * removed. Negative int means count back from the |
4368 | * end of the items. |
4369 | */ |
4370 | Datum |
4371 | jsonb_delete_idx(PG_FUNCTION_ARGS) |
4372 | { |
4373 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4374 | int idx = PG_GETARG_INT32(1); |
4375 | JsonbParseState *state = NULL; |
4376 | JsonbIterator *it; |
4377 | uint32 i = 0, |
4378 | n; |
4379 | JsonbValue v, |
4380 | *res = NULL; |
4381 | JsonbIteratorToken r; |
4382 | |
4383 | if (JB_ROOT_IS_SCALAR(in)) |
4384 | ereport(ERROR, |
4385 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4386 | errmsg("cannot delete from scalar" ))); |
4387 | |
4388 | if (JB_ROOT_IS_OBJECT(in)) |
4389 | ereport(ERROR, |
4390 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4391 | errmsg("cannot delete from object using integer index" ))); |
4392 | |
4393 | if (JB_ROOT_COUNT(in) == 0) |
4394 | PG_RETURN_JSONB_P(in); |
4395 | |
4396 | it = JsonbIteratorInit(&in->root); |
4397 | |
4398 | r = JsonbIteratorNext(&it, &v, false); |
4399 | Assert(r == WJB_BEGIN_ARRAY); |
4400 | n = v.val.array.nElems; |
4401 | |
4402 | if (idx < 0) |
4403 | { |
4404 | if (-idx > n) |
4405 | idx = n; |
4406 | else |
4407 | idx = n + idx; |
4408 | } |
4409 | |
4410 | if (idx >= n) |
4411 | PG_RETURN_JSONB_P(in); |
4412 | |
4413 | pushJsonbValue(&state, r, NULL); |
4414 | |
4415 | while ((r = JsonbIteratorNext(&it, &v, true)) != WJB_DONE) |
4416 | { |
4417 | if (r == WJB_ELEM) |
4418 | { |
4419 | if (i++ == idx) |
4420 | continue; |
4421 | } |
4422 | |
4423 | res = pushJsonbValue(&state, r, r < WJB_BEGIN_ARRAY ? &v : NULL); |
4424 | } |
4425 | |
4426 | Assert(res != NULL); |
4427 | |
4428 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4429 | } |
4430 | |
4431 | /* |
4432 | * SQL function jsonb_set(jsonb, text[], jsonb, boolean) |
4433 | * |
4434 | */ |
4435 | Datum |
4436 | jsonb_set(PG_FUNCTION_ARGS) |
4437 | { |
4438 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4439 | ArrayType *path = PG_GETARG_ARRAYTYPE_P(1); |
4440 | Jsonb *newval = PG_GETARG_JSONB_P(2); |
4441 | bool create = PG_GETARG_BOOL(3); |
4442 | JsonbValue *res = NULL; |
4443 | Datum *path_elems; |
4444 | bool *path_nulls; |
4445 | int path_len; |
4446 | JsonbIterator *it; |
4447 | JsonbParseState *st = NULL; |
4448 | |
4449 | if (ARR_NDIM(path) > 1) |
4450 | ereport(ERROR, |
4451 | (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR), |
4452 | errmsg("wrong number of array subscripts" ))); |
4453 | |
4454 | if (JB_ROOT_IS_SCALAR(in)) |
4455 | ereport(ERROR, |
4456 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4457 | errmsg("cannot set path in scalar" ))); |
4458 | |
4459 | if (JB_ROOT_COUNT(in) == 0 && !create) |
4460 | PG_RETURN_JSONB_P(in); |
4461 | |
4462 | deconstruct_array(path, TEXTOID, -1, false, 'i', |
4463 | &path_elems, &path_nulls, &path_len); |
4464 | |
4465 | if (path_len == 0) |
4466 | PG_RETURN_JSONB_P(in); |
4467 | |
4468 | it = JsonbIteratorInit(&in->root); |
4469 | |
4470 | res = setPath(&it, path_elems, path_nulls, path_len, &st, |
4471 | 0, newval, create ? JB_PATH_CREATE : JB_PATH_REPLACE); |
4472 | |
4473 | Assert(res != NULL); |
4474 | |
4475 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4476 | } |
4477 | |
4478 | |
4479 | /* |
4480 | * SQL function jsonb_delete_path(jsonb, text[]) |
4481 | */ |
4482 | Datum |
4483 | jsonb_delete_path(PG_FUNCTION_ARGS) |
4484 | { |
4485 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4486 | ArrayType *path = PG_GETARG_ARRAYTYPE_P(1); |
4487 | JsonbValue *res = NULL; |
4488 | Datum *path_elems; |
4489 | bool *path_nulls; |
4490 | int path_len; |
4491 | JsonbIterator *it; |
4492 | JsonbParseState *st = NULL; |
4493 | |
4494 | if (ARR_NDIM(path) > 1) |
4495 | ereport(ERROR, |
4496 | (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR), |
4497 | errmsg("wrong number of array subscripts" ))); |
4498 | |
4499 | if (JB_ROOT_IS_SCALAR(in)) |
4500 | ereport(ERROR, |
4501 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4502 | errmsg("cannot delete path in scalar" ))); |
4503 | |
4504 | if (JB_ROOT_COUNT(in) == 0) |
4505 | PG_RETURN_JSONB_P(in); |
4506 | |
4507 | deconstruct_array(path, TEXTOID, -1, false, 'i', |
4508 | &path_elems, &path_nulls, &path_len); |
4509 | |
4510 | if (path_len == 0) |
4511 | PG_RETURN_JSONB_P(in); |
4512 | |
4513 | it = JsonbIteratorInit(&in->root); |
4514 | |
4515 | res = setPath(&it, path_elems, path_nulls, path_len, &st, |
4516 | 0, NULL, JB_PATH_DELETE); |
4517 | |
4518 | Assert(res != NULL); |
4519 | |
4520 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4521 | } |
4522 | |
4523 | /* |
4524 | * SQL function jsonb_insert(jsonb, text[], jsonb, boolean) |
4525 | * |
4526 | */ |
4527 | Datum |
4528 | jsonb_insert(PG_FUNCTION_ARGS) |
4529 | { |
4530 | Jsonb *in = PG_GETARG_JSONB_P(0); |
4531 | ArrayType *path = PG_GETARG_ARRAYTYPE_P(1); |
4532 | Jsonb *newval = PG_GETARG_JSONB_P(2); |
4533 | bool after = PG_GETARG_BOOL(3); |
4534 | JsonbValue *res = NULL; |
4535 | Datum *path_elems; |
4536 | bool *path_nulls; |
4537 | int path_len; |
4538 | JsonbIterator *it; |
4539 | JsonbParseState *st = NULL; |
4540 | |
4541 | if (ARR_NDIM(path) > 1) |
4542 | ereport(ERROR, |
4543 | (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR), |
4544 | errmsg("wrong number of array subscripts" ))); |
4545 | |
4546 | if (JB_ROOT_IS_SCALAR(in)) |
4547 | ereport(ERROR, |
4548 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4549 | errmsg("cannot set path in scalar" ))); |
4550 | |
4551 | deconstruct_array(path, TEXTOID, -1, false, 'i', |
4552 | &path_elems, &path_nulls, &path_len); |
4553 | |
4554 | if (path_len == 0) |
4555 | PG_RETURN_JSONB_P(in); |
4556 | |
4557 | it = JsonbIteratorInit(&in->root); |
4558 | |
4559 | res = setPath(&it, path_elems, path_nulls, path_len, &st, 0, newval, |
4560 | after ? JB_PATH_INSERT_AFTER : JB_PATH_INSERT_BEFORE); |
4561 | |
4562 | Assert(res != NULL); |
4563 | |
4564 | PG_RETURN_JSONB_P(JsonbValueToJsonb(res)); |
4565 | } |
4566 | |
/*
 * Iterate over two jsonb values and merge them into one.
 *
 * The logic of this function is copied from the corresponding hstore
 * function, except for the case where both it1 and it2 represent
 * jbvObject.  In that case we just append the content of it2 to it1
 * without any verification.
 *
 * it1, it2: iterators positioned at the start of the two inputs; the first
 *		token of each is consumed here to decide which case applies.
 * state: parse state into which the merged token stream is pushed.
 *
 * Returns the value produced by the final pushJsonbValue() call.  Raises
 * an error when neither the object/object, array/array, nor
 * (non-scalar) array/object case applies.
 */
static JsonbValue *
IteratorConcat(JsonbIterator **it1, JsonbIterator **it2,
			   JsonbParseState **state)
{
	JsonbValue	v1,
				v2,
			   *res = NULL;
	JsonbIteratorToken r1,
				r2,
				rk1,
				rk2;

	/* fetch the opening token of each input; rk1/rk2 keep it for later */
	r1 = rk1 = JsonbIteratorNext(it1, &v1, false);
	r2 = rk2 = JsonbIteratorNext(it2, &v2, false);

	/*
	 * Both elements are objects.
	 */
	if (rk1 == WJB_BEGIN_OBJECT && rk2 == WJB_BEGIN_OBJECT)
	{
		/*
		 * Append all tokens from it1 to res, except the final
		 * WJB_END_OBJECT (because res will not be finished yet).
		 */
		pushJsonbValue(state, r1, NULL);
		while ((r1 = JsonbIteratorNext(it1, &v1, true)) != WJB_END_OBJECT)
			pushJsonbValue(state, r1, &v1);

		/*
		 * Append all tokens from it2 to res, including the final
		 * WJB_END_OBJECT (which completes the concatenation).
		 */
		while ((r2 = JsonbIteratorNext(it2, &v2, true)) != WJB_DONE)
			res = pushJsonbValue(state, r2, r2 != WJB_END_OBJECT ? &v2 : NULL);
	}

	/*
	 * Both elements are arrays (either can be scalar).
	 */
	else if (rk1 == WJB_BEGIN_ARRAY && rk2 == WJB_BEGIN_ARRAY)
	{
		pushJsonbValue(state, r1, NULL);

		/* elements of the first array, stopping before its end token */
		while ((r1 = JsonbIteratorNext(it1, &v1, true)) != WJB_END_ARRAY)
		{
			Assert(r1 == WJB_ELEM);
			pushJsonbValue(state, r1, &v1);
		}

		/* elements of the second array, likewise */
		while ((r2 = JsonbIteratorNext(it2, &v2, true)) != WJB_END_ARRAY)
		{
			Assert(r2 == WJB_ELEM);
			pushJsonbValue(state, WJB_ELEM, &v2);
		}

		/* a single end token closes the combined array */
		res = pushJsonbValue(state, WJB_END_ARRAY, NULL /* signal to sort */ );
	}
	/* have we got array || object or object || array? */
	else if (((rk1 == WJB_BEGIN_ARRAY && !(*it1)->isScalar) && rk2 == WJB_BEGIN_OBJECT) ||
			 (rk1 == WJB_BEGIN_OBJECT && (rk2 == WJB_BEGIN_ARRAY && !(*it2)->isScalar)))
	{

		JsonbIterator **it_array = rk1 == WJB_BEGIN_ARRAY ? it1 : it2;
		JsonbIterator **it_object = rk1 == WJB_BEGIN_OBJECT ? it1 : it2;

		/* object on the left means it becomes the first array element */
		bool		prepend = (rk1 == WJB_BEGIN_OBJECT);

		/* the result is always an array */
		pushJsonbValue(state, WJB_BEGIN_ARRAY, NULL);

		if (prepend)
		{
			/*
			 * The object's opening token was already consumed above, so
			 * push it explicitly, then copy the object through its end
			 * token.
			 */
			pushJsonbValue(state, WJB_BEGIN_OBJECT, NULL);
			while ((r1 = JsonbIteratorNext(it_object, &v1, true)) != WJB_DONE)
				pushJsonbValue(state, r1, r1 != WJB_END_OBJECT ? &v1 : NULL);

			/* then the array's elements and its end token */
			while ((r2 = JsonbIteratorNext(it_array, &v2, true)) != WJB_DONE)
				res = pushJsonbValue(state, r2, r2 != WJB_END_ARRAY ? &v2 : NULL);
		}
		else
		{
			/* array elements first, holding back the array's end token */
			while ((r1 = JsonbIteratorNext(it_array, &v1, true)) != WJB_END_ARRAY)
				pushJsonbValue(state, r1, &v1);

			/* then the whole object as one more element */
			pushJsonbValue(state, WJB_BEGIN_OBJECT, NULL);
			while ((r2 = JsonbIteratorNext(it_object, &v2, true)) != WJB_DONE)
				pushJsonbValue(state, r2, r2 != WJB_END_OBJECT ? &v2 : NULL);

			/* finally close the result array */
			res = pushJsonbValue(state, WJB_END_ARRAY, NULL);
		}
	}
	else
	{
		/*
		 * This must be scalar || object or object || scalar, as that's all
		 * that's left. Both of these make no sense, so error out.
		 */
		ereport(ERROR,
				(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
				 errmsg("invalid concatenation of jsonb objects")));
	}

	return res;
}
4677 | |
4678 | /* |
4679 | * Do most of the heavy work for jsonb_set/jsonb_insert |
4680 | * |
4681 | * If JB_PATH_DELETE bit is set in op_type, the element is to be removed. |
4682 | * |
4683 | * If any bit mentioned in JB_PATH_CREATE_OR_INSERT is set in op_type, |
4684 | * we create the new value if the key or array index does not exist. |
4685 | * |
4686 | * Bits JB_PATH_INSERT_BEFORE and JB_PATH_INSERT_AFTER in op_type |
4687 | * behave as JB_PATH_CREATE if new value is inserted in JsonbObject. |
4688 | * |
4689 | * All path elements before the last must already exist |
4690 | * whatever bits in op_type are set, or nothing is done. |
4691 | */ |
4692 | static JsonbValue * |
4693 | setPath(JsonbIterator **it, Datum *path_elems, |
4694 | bool *path_nulls, int path_len, |
4695 | JsonbParseState **st, int level, Jsonb *newval, int op_type) |
4696 | { |
4697 | JsonbValue v; |
4698 | JsonbIteratorToken r; |
4699 | JsonbValue *res; |
4700 | |
4701 | check_stack_depth(); |
4702 | |
4703 | if (path_nulls[level]) |
4704 | ereport(ERROR, |
4705 | (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED), |
4706 | errmsg("path element at position %d is null" , |
4707 | level + 1))); |
4708 | |
4709 | r = JsonbIteratorNext(it, &v, false); |
4710 | |
4711 | switch (r) |
4712 | { |
4713 | case WJB_BEGIN_ARRAY: |
4714 | (void) pushJsonbValue(st, r, NULL); |
4715 | setPathArray(it, path_elems, path_nulls, path_len, st, level, |
4716 | newval, v.val.array.nElems, op_type); |
4717 | r = JsonbIteratorNext(it, &v, false); |
4718 | Assert(r == WJB_END_ARRAY); |
4719 | res = pushJsonbValue(st, r, NULL); |
4720 | break; |
4721 | case WJB_BEGIN_OBJECT: |
4722 | (void) pushJsonbValue(st, r, NULL); |
4723 | setPathObject(it, path_elems, path_nulls, path_len, st, level, |
4724 | newval, v.val.object.nPairs, op_type); |
4725 | r = JsonbIteratorNext(it, &v, true); |
4726 | Assert(r == WJB_END_OBJECT); |
4727 | res = pushJsonbValue(st, r, NULL); |
4728 | break; |
4729 | case WJB_ELEM: |
4730 | case WJB_VALUE: |
4731 | res = pushJsonbValue(st, r, &v); |
4732 | break; |
4733 | default: |
4734 | elog(ERROR, "unrecognized iterator result: %d" , (int) r); |
4735 | res = NULL; /* keep compiler quiet */ |
4736 | break; |
4737 | } |
4738 | |
4739 | return res; |
4740 | } |
4741 | |
/*
 * Object walker for setPath
 *
 * Called after the object's opening token has been pushed.  Reads npairs
 * key/value pairs from the iterator and pushes them to the parse state,
 * applying op_type to the pair whose key equals path_elems[level].
 *
 * When level is the last path position, the matching pair is replaced by
 * newval, dropped (JB_PATH_DELETE), or rejected with an error (insert
 * operations).  When it is an earlier position, the key is pushed and
 * setPath() is called for the value at level + 1.  If no key matches and
 * a create/insert operation was requested at the last path position, a
 * new pair is added.  All other pairs are copied through unchanged.
 */
static void
setPathObject(JsonbIterator **it, Datum *path_elems, bool *path_nulls,
			  int path_len, JsonbParseState **st, int level,
			  Jsonb *newval, uint32 npairs, int op_type)
{
	JsonbValue	v;
	int			i;
	JsonbValue	k;
	bool		done = false;

	/* no usable path element at this level: just copy everything */
	if (level >= path_len || path_nulls[level])
		done = true;

	/* empty object is a special case for create */
	if ((npairs == 0) && (op_type & JB_PATH_CREATE_OR_INSERT) &&
		(level == path_len - 1))
	{
		JsonbValue	newkey;

		newkey.type = jbvString;
		newkey.val.string.len = VARSIZE_ANY_EXHDR(path_elems[level]);
		newkey.val.string.val = VARDATA_ANY(path_elems[level]);

		(void) pushJsonbValue(st, WJB_KEY, &newkey);
		addJsonbToParseState(st, newval);
	}

	for (i = 0; i < npairs; i++)
	{
		JsonbIteratorToken r = JsonbIteratorNext(it, &k, true);

		Assert(r == WJB_KEY);

		/* does this key equal the path element for this level? */
		if (!done &&
			k.val.string.len == VARSIZE_ANY_EXHDR(path_elems[level]) &&
			memcmp(k.val.string.val, VARDATA_ANY(path_elems[level]),
				   k.val.string.len) == 0)
		{
			if (level == path_len - 1)
			{
				/*
				 * called from jsonb_insert(), it forbids redefining an
				 * existing value
				 */
				if (op_type & (JB_PATH_INSERT_BEFORE | JB_PATH_INSERT_AFTER))
					ereport(ERROR,
							(errcode(ERRCODE_INVALID_PARAMETER_VALUE),
							 errmsg("cannot replace existing key"),
							 errhint("Try using the function jsonb_set "
									 "to replace key value.")));

				r = JsonbIteratorNext(it, &v, true);	/* skip value */

				/* unless deleting, re-emit the key with the new value */
				if (!(op_type & JB_PATH_DELETE))
				{
					(void) pushJsonbValue(st, WJB_KEY, &k);
					addJsonbToParseState(st, newval);
				}
				done = true;
			}
			else
			{
				/* intermediate path step: keep the key, descend into value */
				(void) pushJsonbValue(st, r, &k);
				setPath(it, path_elems, path_nulls, path_len,
						st, level + 1, newval, op_type);
			}
		}
		else
		{
			/*
			 * Last pair reached without finding the key: for create/insert
			 * at the final path position, add the new pair now, just ahead
			 * of the final existing pair.
			 */
			if ((op_type & JB_PATH_CREATE_OR_INSERT) && !done &&
				level == path_len - 1 && i == npairs - 1)
			{
				JsonbValue	newkey;

				newkey.type = jbvString;
				newkey.val.string.len = VARSIZE_ANY_EXHDR(path_elems[level]);
				newkey.val.string.val = VARDATA_ANY(path_elems[level]);

				(void) pushJsonbValue(st, WJB_KEY, &newkey);
				addJsonbToParseState(st, newval);
			}

			/* copy this key and its value through unchanged */
			(void) pushJsonbValue(st, r, &k);
			r = JsonbIteratorNext(it, &v, false);
			(void) pushJsonbValue(st, r, r < WJB_BEGIN_ARRAY ? &v : NULL);
			if (r == WJB_BEGIN_ARRAY || r == WJB_BEGIN_OBJECT)
			{
				/* nesting depth relative to the value's own container */
				int			walking_level = 1;

				/* copy nested tokens until that container is closed again */
				while (walking_level != 0)
				{
					r = JsonbIteratorNext(it, &v, false);

					if (r == WJB_BEGIN_ARRAY || r == WJB_BEGIN_OBJECT)
						++walking_level;
					if (r == WJB_END_ARRAY || r == WJB_END_OBJECT)
						--walking_level;

					(void) pushJsonbValue(st, r, r < WJB_BEGIN_ARRAY ? &v : NULL);
				}
			}
		}
	}
}
4848 | |
4849 | /* |
4850 | * Array walker for setPath |
4851 | */ |
4852 | static void |
4853 | setPathArray(JsonbIterator **it, Datum *path_elems, bool *path_nulls, |
4854 | int path_len, JsonbParseState **st, int level, |
4855 | Jsonb *newval, uint32 nelems, int op_type) |
4856 | { |
4857 | JsonbValue v; |
4858 | int idx, |
4859 | i; |
4860 | bool done = false; |
4861 | |
4862 | /* pick correct index */ |
4863 | if (level < path_len && !path_nulls[level]) |
4864 | { |
4865 | char *c = TextDatumGetCString(path_elems[level]); |
4866 | long lindex; |
4867 | char *badp; |
4868 | |
4869 | errno = 0; |
4870 | lindex = strtol(c, &badp, 10); |
4871 | if (errno != 0 || badp == c || *badp != '\0' || lindex > INT_MAX || |
4872 | lindex < INT_MIN) |
4873 | ereport(ERROR, |
4874 | (errcode(ERRCODE_INVALID_TEXT_REPRESENTATION), |
4875 | errmsg("path element at position %d is not an integer: \"%s\"" , |
4876 | level + 1, c))); |
4877 | idx = lindex; |
4878 | } |
4879 | else |
4880 | idx = nelems; |
4881 | |
4882 | if (idx < 0) |
4883 | { |
4884 | if (-idx > nelems) |
4885 | idx = INT_MIN; |
4886 | else |
4887 | idx = nelems + idx; |
4888 | } |
4889 | |
4890 | if (idx > 0 && idx > nelems) |
4891 | idx = nelems; |
4892 | |
4893 | /* |
4894 | * if we're creating, and idx == INT_MIN, we prepend the new value to the |
4895 | * array also if the array is empty - in which case we don't really care |
4896 | * what the idx value is |
4897 | */ |
4898 | |
4899 | if ((idx == INT_MIN || nelems == 0) && (level == path_len - 1) && |
4900 | (op_type & JB_PATH_CREATE_OR_INSERT)) |
4901 | { |
4902 | Assert(newval != NULL); |
4903 | addJsonbToParseState(st, newval); |
4904 | done = true; |
4905 | } |
4906 | |
4907 | /* iterate over the array elements */ |
4908 | for (i = 0; i < nelems; i++) |
4909 | { |
4910 | JsonbIteratorToken r; |
4911 | |
4912 | if (i == idx && level < path_len) |
4913 | { |
4914 | if (level == path_len - 1) |
4915 | { |
4916 | r = JsonbIteratorNext(it, &v, true); /* skip */ |
4917 | |
4918 | if (op_type & (JB_PATH_INSERT_BEFORE | JB_PATH_CREATE)) |
4919 | addJsonbToParseState(st, newval); |
4920 | |
4921 | /* |
4922 | * We should keep current value only in case of |
4923 | * JB_PATH_INSERT_BEFORE or JB_PATH_INSERT_AFTER because |
4924 | * otherwise it should be deleted or replaced |
4925 | */ |
4926 | if (op_type & (JB_PATH_INSERT_AFTER | JB_PATH_INSERT_BEFORE)) |
4927 | (void) pushJsonbValue(st, r, &v); |
4928 | |
4929 | if (op_type & (JB_PATH_INSERT_AFTER | JB_PATH_REPLACE)) |
4930 | addJsonbToParseState(st, newval); |
4931 | |
4932 | done = true; |
4933 | } |
4934 | else |
4935 | (void) setPath(it, path_elems, path_nulls, path_len, |
4936 | st, level + 1, newval, op_type); |
4937 | } |
4938 | else |
4939 | { |
4940 | r = JsonbIteratorNext(it, &v, false); |
4941 | |
4942 | (void) pushJsonbValue(st, r, r < WJB_BEGIN_ARRAY ? &v : NULL); |
4943 | |
4944 | if (r == WJB_BEGIN_ARRAY || r == WJB_BEGIN_OBJECT) |
4945 | { |
4946 | int walking_level = 1; |
4947 | |
4948 | while (walking_level != 0) |
4949 | { |
4950 | r = JsonbIteratorNext(it, &v, false); |
4951 | |
4952 | if (r == WJB_BEGIN_ARRAY || r == WJB_BEGIN_OBJECT) |
4953 | ++walking_level; |
4954 | if (r == WJB_END_ARRAY || r == WJB_END_OBJECT) |
4955 | --walking_level; |
4956 | |
4957 | (void) pushJsonbValue(st, r, r < WJB_BEGIN_ARRAY ? &v : NULL); |
4958 | } |
4959 | } |
4960 | |
4961 | if ((op_type & JB_PATH_CREATE_OR_INSERT) && !done && |
4962 | level == path_len - 1 && i == nelems - 1) |
4963 | { |
4964 | addJsonbToParseState(st, newval); |
4965 | } |
4966 | } |
4967 | } |
4968 | } |
4969 | |
4970 | /* |
4971 | * Parse information about what elements of a jsonb document we want to iterate |
4972 | * in functions iterate_json(b)_values. This information is presented in jsonb |
4973 | * format, so that it can be easily extended in the future. |
4974 | */ |
4975 | uint32 |
4976 | parse_jsonb_index_flags(Jsonb *jb) |
4977 | { |
4978 | JsonbIterator *it; |
4979 | JsonbValue v; |
4980 | JsonbIteratorToken type; |
4981 | uint32 flags = 0; |
4982 | |
4983 | it = JsonbIteratorInit(&jb->root); |
4984 | |
4985 | type = JsonbIteratorNext(&it, &v, false); |
4986 | |
4987 | /* |
4988 | * We iterate over array (scalar internally is represented as array, so, |
4989 | * we will accept it too) to check all its elements. Flag names are |
4990 | * chosen the same as jsonb_typeof uses. |
4991 | */ |
4992 | if (type != WJB_BEGIN_ARRAY) |
4993 | ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
4994 | errmsg("wrong flag type, only arrays and scalars are allowed" ))); |
4995 | |
4996 | while ((type = JsonbIteratorNext(&it, &v, false)) == WJB_ELEM) |
4997 | { |
4998 | if (v.type != jbvString) |
4999 | ereport(ERROR, |
5000 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
5001 | errmsg("flag array element is not a string" ), |
5002 | errhint("Possible values are: \"string\", \"numeric\", \"boolean\", \"key\", and \"all\"." ))); |
5003 | |
5004 | if (v.val.string.len == 3 && |
5005 | pg_strncasecmp(v.val.string.val, "all" , 3) == 0) |
5006 | flags |= jtiAll; |
5007 | else if (v.val.string.len == 3 && |
5008 | pg_strncasecmp(v.val.string.val, "key" , 3) == 0) |
5009 | flags |= jtiKey; |
5010 | else if (v.val.string.len == 6 && |
5011 | pg_strncasecmp(v.val.string.val, "string" , 5) == 0) |
5012 | flags |= jtiString; |
5013 | else if (v.val.string.len == 7 && |
5014 | pg_strncasecmp(v.val.string.val, "numeric" , 7) == 0) |
5015 | flags |= jtiNumeric; |
5016 | else if (v.val.string.len == 7 && |
5017 | pg_strncasecmp(v.val.string.val, "boolean" , 7) == 0) |
5018 | flags |= jtiBool; |
5019 | else |
5020 | ereport(ERROR, |
5021 | (errcode(ERRCODE_INVALID_PARAMETER_VALUE), |
5022 | errmsg("wrong flag in flag array: \"%s\"" , |
5023 | pnstrdup(v.val.string.val, v.val.string.len)), |
5024 | errhint("Possible values are: \"string\", \"numeric\", \"boolean\", \"key\", and \"all\"." ))); |
5025 | } |
5026 | |
5027 | /* expect end of array now */ |
5028 | if (type != WJB_END_ARRAY) |
5029 | elog(ERROR, "unexpected end of flag array" ); |
5030 | |
5031 | /* get final WJB_DONE and free iterator */ |
5032 | type = JsonbIteratorNext(&it, &v, false); |
5033 | if (type != WJB_DONE) |
5034 | elog(ERROR, "unexpected end of flag array" ); |
5035 | |
5036 | return flags; |
5037 | } |
5038 | |
5039 | /* |
5040 | * Iterate over jsonb values or elements, specified by flags, and pass them |
5041 | * together with an iteration state to a specified JsonIterateStringValuesAction. |
5042 | */ |
5043 | void |
5044 | iterate_jsonb_values(Jsonb *jb, uint32 flags, void *state, |
5045 | JsonIterateStringValuesAction action) |
5046 | { |
5047 | JsonbIterator *it; |
5048 | JsonbValue v; |
5049 | JsonbIteratorToken type; |
5050 | |
5051 | it = JsonbIteratorInit(&jb->root); |
5052 | |
5053 | /* |
5054 | * Just recursively iterating over jsonb and call callback on all |
5055 | * corresponding elements |
5056 | */ |
5057 | while ((type = JsonbIteratorNext(&it, &v, false)) != WJB_DONE) |
5058 | { |
5059 | if (type == WJB_KEY) |
5060 | { |
5061 | if (flags & jtiKey) |
5062 | action(state, v.val.string.val, v.val.string.len); |
5063 | |
5064 | continue; |
5065 | } |
5066 | else if (!(type == WJB_VALUE || type == WJB_ELEM)) |
5067 | { |
5068 | /* do not call callback for composite JsonbValue */ |
5069 | continue; |
5070 | } |
5071 | |
5072 | /* JsonbValue is a value of object or element of array */ |
5073 | switch (v.type) |
5074 | { |
5075 | case jbvString: |
5076 | if (flags & jtiString) |
5077 | action(state, v.val.string.val, v.val.string.len); |
5078 | break; |
5079 | case jbvNumeric: |
5080 | if (flags & jtiNumeric) |
5081 | { |
5082 | char *val; |
5083 | |
5084 | val = DatumGetCString(DirectFunctionCall1(numeric_out, |
5085 | NumericGetDatum(v.val.numeric))); |
5086 | |
5087 | action(state, val, strlen(val)); |
5088 | pfree(val); |
5089 | } |
5090 | break; |
5091 | case jbvBool: |
5092 | if (flags & jtiBool) |
5093 | { |
5094 | if (v.val.boolean) |
5095 | action(state, "true" , 4); |
5096 | else |
5097 | action(state, "false" , 5); |
5098 | } |
5099 | break; |
5100 | default: |
5101 | /* do not call callback for composite JsonbValue */ |
5102 | break; |
5103 | } |
5104 | } |
5105 | } |
5106 | |
5107 | /* |
5108 | * Iterate over json values and elements, specified by flags, and pass them |
5109 | * together with an iteration state to a specified JsonIterateStringValuesAction. |
5110 | */ |
5111 | void |
5112 | iterate_json_values(text *json, uint32 flags, void *action_state, |
5113 | JsonIterateStringValuesAction action) |
5114 | { |
5115 | JsonLexContext *lex = makeJsonLexContext(json, true); |
5116 | JsonSemAction *sem = palloc0(sizeof(JsonSemAction)); |
5117 | IterateJsonStringValuesState *state = palloc0(sizeof(IterateJsonStringValuesState)); |
5118 | |
5119 | state->lex = lex; |
5120 | state->action = action; |
5121 | state->action_state = action_state; |
5122 | state->flags = flags; |
5123 | |
5124 | sem->semstate = (void *) state; |
5125 | sem->scalar = iterate_values_scalar; |
5126 | sem->object_field_start = iterate_values_object_field_start; |
5127 | |
5128 | pg_parse_json(lex, sem); |
5129 | } |
5130 | |
5131 | /* |
5132 | * An auxiliary function for iterate_json_values to invoke a specified |
5133 | * JsonIterateStringValuesAction for specified values. |
5134 | */ |
5135 | static void |
5136 | iterate_values_scalar(void *state, char *token, JsonTokenType tokentype) |
5137 | { |
5138 | IterateJsonStringValuesState *_state = (IterateJsonStringValuesState *) state; |
5139 | |
5140 | switch (tokentype) |
5141 | { |
5142 | case JSON_TOKEN_STRING: |
5143 | if (_state->flags & jtiString) |
5144 | _state->action(_state->action_state, token, strlen(token)); |
5145 | break; |
5146 | case JSON_TOKEN_NUMBER: |
5147 | if (_state->flags & jtiNumeric) |
5148 | _state->action(_state->action_state, token, strlen(token)); |
5149 | break; |
5150 | case JSON_TOKEN_TRUE: |
5151 | case JSON_TOKEN_FALSE: |
5152 | if (_state->flags & jtiBool) |
5153 | _state->action(_state->action_state, token, strlen(token)); |
5154 | break; |
5155 | default: |
5156 | /* do not call callback for any other token */ |
5157 | break; |
5158 | } |
5159 | } |
5160 | |
5161 | static void |
5162 | iterate_values_object_field_start(void *state, char *fname, bool isnull) |
5163 | { |
5164 | IterateJsonStringValuesState *_state = (IterateJsonStringValuesState *) state; |
5165 | |
5166 | if (_state->flags & jtiKey) |
5167 | { |
5168 | char *val = pstrdup(fname); |
5169 | |
5170 | _state->action(_state->action_state, val, strlen(val)); |
5171 | } |
5172 | } |
5173 | |
5174 | /* |
5175 | * Iterate over a jsonb, and apply a specified JsonTransformStringValuesAction |
5176 | * to every string value or element. Any necessary context for a |
5177 | * JsonTransformStringValuesAction can be passed in the action_state variable. |
5178 | * Function returns a copy of an original jsonb object with transformed values. |
5179 | */ |
5180 | Jsonb * |
5181 | transform_jsonb_string_values(Jsonb *jsonb, void *action_state, |
5182 | JsonTransformStringValuesAction transform_action) |
5183 | { |
5184 | JsonbIterator *it; |
5185 | JsonbValue v, |
5186 | *res = NULL; |
5187 | JsonbIteratorToken type; |
5188 | JsonbParseState *st = NULL; |
5189 | text *out; |
5190 | bool is_scalar = false; |
5191 | |
5192 | it = JsonbIteratorInit(&jsonb->root); |
5193 | is_scalar = it->isScalar; |
5194 | |
5195 | while ((type = JsonbIteratorNext(&it, &v, false)) != WJB_DONE) |
5196 | { |
5197 | if ((type == WJB_VALUE || type == WJB_ELEM) && v.type == jbvString) |
5198 | { |
5199 | out = transform_action(action_state, v.val.string.val, v.val.string.len); |
5200 | v.val.string.val = VARDATA_ANY(out); |
5201 | v.val.string.len = VARSIZE_ANY_EXHDR(out); |
5202 | res = pushJsonbValue(&st, type, type < WJB_BEGIN_ARRAY ? &v : NULL); |
5203 | } |
5204 | else |
5205 | { |
5206 | res = pushJsonbValue(&st, type, (type == WJB_KEY || |
5207 | type == WJB_VALUE || |
5208 | type == WJB_ELEM) ? &v : NULL); |
5209 | } |
5210 | } |
5211 | |
5212 | if (res->type == jbvArray) |
5213 | res->val.array.rawScalar = is_scalar; |
5214 | |
5215 | return JsonbValueToJsonb(res); |
5216 | } |
5217 | |
5218 | /* |
5219 | * Iterate over a json, and apply a specified JsonTransformStringValuesAction |
5220 | * to every string value or element. Any necessary context for a |
5221 | * JsonTransformStringValuesAction can be passed in the action_state variable. |
5222 | * Function returns a StringInfo, which is a copy of an original json with |
5223 | * transformed values. |
5224 | */ |
5225 | text * |
5226 | transform_json_string_values(text *json, void *action_state, |
5227 | JsonTransformStringValuesAction transform_action) |
5228 | { |
5229 | JsonLexContext *lex = makeJsonLexContext(json, true); |
5230 | JsonSemAction *sem = palloc0(sizeof(JsonSemAction)); |
5231 | TransformJsonStringValuesState *state = palloc0(sizeof(TransformJsonStringValuesState)); |
5232 | |
5233 | state->lex = lex; |
5234 | state->strval = makeStringInfo(); |
5235 | state->action = transform_action; |
5236 | state->action_state = action_state; |
5237 | |
5238 | sem->semstate = (void *) state; |
5239 | sem->scalar = transform_string_values_scalar; |
5240 | sem->object_start = transform_string_values_object_start; |
5241 | sem->object_end = transform_string_values_object_end; |
5242 | sem->array_start = transform_string_values_array_start; |
5243 | sem->array_end = transform_string_values_array_end; |
5244 | sem->scalar = transform_string_values_scalar; |
5245 | sem->array_element_start = transform_string_values_array_element_start; |
5246 | sem->object_field_start = transform_string_values_object_field_start; |
5247 | |
5248 | pg_parse_json(lex, sem); |
5249 | |
5250 | return cstring_to_text_with_len(state->strval->data, state->strval->len); |
5251 | } |
5252 | |
/*
 * Set of auxiliary functions for transform_json_string_values that invoke the
 * specified JsonTransformStringValuesAction for all string values and leave
 * everything else untouched.
 */
5258 | static void |
5259 | transform_string_values_object_start(void *state) |
5260 | { |
5261 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5262 | |
5263 | appendStringInfoCharMacro(_state->strval, '{'); |
5264 | } |
5265 | |
5266 | static void |
5267 | transform_string_values_object_end(void *state) |
5268 | { |
5269 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5270 | |
5271 | appendStringInfoCharMacro(_state->strval, '}'); |
5272 | } |
5273 | |
5274 | static void |
5275 | transform_string_values_array_start(void *state) |
5276 | { |
5277 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5278 | |
5279 | appendStringInfoCharMacro(_state->strval, '['); |
5280 | } |
5281 | |
5282 | static void |
5283 | transform_string_values_array_end(void *state) |
5284 | { |
5285 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5286 | |
5287 | appendStringInfoCharMacro(_state->strval, ']'); |
5288 | } |
5289 | |
5290 | static void |
5291 | transform_string_values_object_field_start(void *state, char *fname, bool isnull) |
5292 | { |
5293 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5294 | |
5295 | if (_state->strval->data[_state->strval->len - 1] != '{') |
5296 | appendStringInfoCharMacro(_state->strval, ','); |
5297 | |
5298 | /* |
5299 | * Unfortunately we don't have the quoted and escaped string any more, so |
5300 | * we have to re-escape it. |
5301 | */ |
5302 | escape_json(_state->strval, fname); |
5303 | appendStringInfoCharMacro(_state->strval, ':'); |
5304 | } |
5305 | |
5306 | static void |
5307 | transform_string_values_array_element_start(void *state, bool isnull) |
5308 | { |
5309 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5310 | |
5311 | if (_state->strval->data[_state->strval->len - 1] != '[') |
5312 | appendStringInfoCharMacro(_state->strval, ','); |
5313 | } |
5314 | |
5315 | static void |
5316 | transform_string_values_scalar(void *state, char *token, JsonTokenType tokentype) |
5317 | { |
5318 | TransformJsonStringValuesState *_state = (TransformJsonStringValuesState *) state; |
5319 | |
5320 | if (tokentype == JSON_TOKEN_STRING) |
5321 | { |
5322 | text *out = _state->action(_state->action_state, token, strlen(token)); |
5323 | |
5324 | escape_json(_state->strval, text_to_cstring(out)); |
5325 | } |
5326 | else |
5327 | appendStringInfoString(_state->strval, token); |
5328 | } |
5329 | |