PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
jsonb_plpython.c
Go to the documentation of this file.
1#include "postgres.h"
2
3#include "plpy_elog.h"
4#include "plpy_typeio.h"
5#include "plpython.h"
6#include "utils/fmgrprotos.h"
7#include "utils/jsonb.h"
8#include "utils/numeric.h"
9
11 .name = "jsonb_plpython",
12 .version = PG_VERSION
13);
14
15/* for PLyObject_AsString in plpy_typeio.c */
16typedef char *(*PLyObject_AsString_t) (PyObject *plrv);
18
19typedef void (*PLy_elog_impl_t) (int elevel, const char *fmt,...);
21
22/*
23 * decimal_constructor is a function from python library and used
24 * for transforming strings into python decimal type
25 */
26static PyObject *decimal_constructor;
27
28static PyObject *PLyObject_FromJsonbContainer(JsonbContainer *jsonb);
29static JsonbValue *PLyObject_ToJsonbValue(PyObject *obj,
30 JsonbParseState **jsonb_state, bool is_elem);
31
32typedef PyObject *(*PLyUnicode_FromStringAndSize_t)
33 (const char *s, Py_ssize_t size);
35
36/*
37 * Module initialize function: fetch function pointers for cross-module calls.
38 */
39void
41{
42 /* Asserts verify that typedefs above match original declarations */
45 load_external_function("$libdir/" PLPYTHON_LIBNAME, "PLyObject_AsString",
46 true, NULL);
49 load_external_function("$libdir/" PLPYTHON_LIBNAME, "PLyUnicode_FromStringAndSize",
50 true, NULL);
53 load_external_function("$libdir/" PLPYTHON_LIBNAME, "PLy_elog_impl",
54 true, NULL);
55}
56
57/* These defines must be after the _PG_init */
58#define PLyObject_AsString (PLyObject_AsString_p)
59#define PLyUnicode_FromStringAndSize (PLyUnicode_FromStringAndSize_p)
60#undef PLy_elog
61#define PLy_elog (PLy_elog_impl_p)
62
63/*
64 * PLyUnicode_FromJsonbValue
65 *
66 * Transform string JsonbValue to Python string.
67 */
68static PyObject *
70{
71 Assert(jbv->type == jbvString);
72
73 return PLyUnicode_FromStringAndSize(jbv->val.string.val, jbv->val.string.len);
74}
75
76/*
77 * PLyUnicode_ToJsonbValue
78 *
79 * Transform Python string to JsonbValue.
80 */
81static void
82PLyUnicode_ToJsonbValue(PyObject *obj, JsonbValue *jbvElem)
83{
84 jbvElem->type = jbvString;
85 jbvElem->val.string.val = PLyObject_AsString(obj);
86 jbvElem->val.string.len = strlen(jbvElem->val.string.val);
87}
88
89/*
90 * PLyObject_FromJsonbValue
91 *
92 * Transform JsonbValue to PyObject.
93 */
94static PyObject *
96{
97 switch (jsonbValue->type)
98 {
99 case jbvNull:
100 Py_RETURN_NONE;
101
102 case jbvBinary:
103 return PLyObject_FromJsonbContainer(jsonbValue->val.binary.data);
104
105 case jbvNumeric:
106 {
107 Datum num;
108 char *str;
109
110 num = NumericGetDatum(jsonbValue->val.numeric);
112
113 return PyObject_CallFunction(decimal_constructor, "s", str);
114 }
115
116 case jbvString:
117 return PLyUnicode_FromJsonbValue(jsonbValue);
118
119 case jbvBool:
120 if (jsonbValue->val.boolean)
121 Py_RETURN_TRUE;
122 else
123 Py_RETURN_FALSE;
124
125 default:
126 elog(ERROR, "unexpected jsonb value type: %d", jsonbValue->type);
127 return NULL;
128 }
129}
130
131/*
132 * PLyObject_FromJsonbContainer
133 *
134 * Transform JsonbContainer to PyObject.
135 */
136static PyObject *
138{
140 JsonbValue v;
141 JsonbIterator *it;
142 PyObject *result;
143
144 it = JsonbIteratorInit(jsonb);
145 r = JsonbIteratorNext(&it, &v, true);
146
147 switch (r)
148 {
149 case WJB_BEGIN_ARRAY:
150 if (v.val.array.rawScalar)
151 {
152 JsonbValue tmp;
153
154 if ((r = JsonbIteratorNext(&it, &v, true)) != WJB_ELEM ||
155 (r = JsonbIteratorNext(&it, &tmp, true)) != WJB_END_ARRAY ||
156 (r = JsonbIteratorNext(&it, &tmp, true)) != WJB_DONE)
157 elog(ERROR, "unexpected jsonb token: %d", r);
158
159 result = PLyObject_FromJsonbValue(&v);
160 }
161 else
162 {
163 PyObject *volatile elem = NULL;
164
165 result = PyList_New(0);
166 if (!result)
167 return NULL;
168
169 PG_TRY();
170 {
171 while ((r = JsonbIteratorNext(&it, &v, true)) != WJB_DONE)
172 {
173 if (r != WJB_ELEM)
174 continue;
175
176 elem = PLyObject_FromJsonbValue(&v);
177
178 PyList_Append(result, elem);
179 Py_XDECREF(elem);
180 elem = NULL;
181 }
182 }
183 PG_CATCH();
184 {
185 Py_XDECREF(elem);
186 Py_XDECREF(result);
187 PG_RE_THROW();
188 }
189 PG_END_TRY();
190 }
191 break;
192
193 case WJB_BEGIN_OBJECT:
194 {
195 PyObject *volatile result_v = PyDict_New();
196 PyObject *volatile key = NULL;
197 PyObject *volatile val = NULL;
198
199 if (!result_v)
200 return NULL;
201
202 PG_TRY();
203 {
204 while ((r = JsonbIteratorNext(&it, &v, true)) != WJB_DONE)
205 {
206 if (r != WJB_KEY)
207 continue;
208
210 if (!key)
211 {
212 Py_XDECREF(result_v);
213 result_v = NULL;
214 break;
215 }
216
217 if ((r = JsonbIteratorNext(&it, &v, true)) != WJB_VALUE)
218 elog(ERROR, "unexpected jsonb token: %d", r);
219
221 if (!val)
222 {
223 Py_XDECREF(key);
224 key = NULL;
225 Py_XDECREF(result_v);
226 result_v = NULL;
227 break;
228 }
229
230 PyDict_SetItem(result_v, key, val);
231
232 Py_XDECREF(key);
233 key = NULL;
234 Py_XDECREF(val);
235 val = NULL;
236 }
237 }
238 PG_CATCH();
239 {
240 Py_XDECREF(result_v);
241 Py_XDECREF(key);
242 Py_XDECREF(val);
243 PG_RE_THROW();
244 }
245 PG_END_TRY();
246
247 result = result_v;
248 }
249 break;
250
251 default:
252 elog(ERROR, "unexpected jsonb token: %d", r);
253 return NULL;
254 }
255
256 return result;
257}
258
259/*
260 * PLyMapping_ToJsonbValue
261 *
262 * Transform Python dict to JsonbValue.
263 */
264static JsonbValue *
265PLyMapping_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state)
266{
267 Py_ssize_t pcount;
268 PyObject *volatile items;
269 JsonbValue *volatile out;
270
271 pcount = PyMapping_Size(obj);
272 items = PyMapping_Items(obj);
273
274 PG_TRY();
275 {
276 Py_ssize_t i;
277
278 pushJsonbValue(jsonb_state, WJB_BEGIN_OBJECT, NULL);
279
280 for (i = 0; i < pcount; i++)
281 {
282 JsonbValue jbvKey;
283 PyObject *item = PyList_GetItem(items, i);
284 PyObject *key = PyTuple_GetItem(item, 0);
285 PyObject *value = PyTuple_GetItem(item, 1);
286
287 /* Python dictionary can have None as key */
288 if (key == Py_None)
289 {
290 jbvKey.type = jbvString;
291 jbvKey.val.string.len = 0;
292 jbvKey.val.string.val = "";
293 }
294 else
295 {
296 /* All others types of keys we serialize to string */
298 }
299
300 (void) pushJsonbValue(jsonb_state, WJB_KEY, &jbvKey);
301 (void) PLyObject_ToJsonbValue(value, jsonb_state, false);
302 }
303
304 out = pushJsonbValue(jsonb_state, WJB_END_OBJECT, NULL);
305 }
306 PG_FINALLY();
307 {
308 Py_DECREF(items);
309 }
310 PG_END_TRY();
311
312 return out;
313}
314
315/*
316 * PLySequence_ToJsonbValue
317 *
318 * Transform python list to JsonbValue. Expects transformed PyObject and
319 * a state required for jsonb construction.
320 */
321static JsonbValue *
322PLySequence_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state)
323{
324 Py_ssize_t i;
325 Py_ssize_t pcount;
326 PyObject *volatile value = NULL;
327
328 pcount = PySequence_Size(obj);
329
330 pushJsonbValue(jsonb_state, WJB_BEGIN_ARRAY, NULL);
331
332 PG_TRY();
333 {
334 for (i = 0; i < pcount; i++)
335 {
336 value = PySequence_GetItem(obj, i);
337 Assert(value);
338
339 (void) PLyObject_ToJsonbValue(value, jsonb_state, true);
340 Py_XDECREF(value);
341 value = NULL;
342 }
343 }
344 PG_CATCH();
345 {
346 Py_XDECREF(value);
347 PG_RE_THROW();
348 }
349 PG_END_TRY();
350
351 return pushJsonbValue(jsonb_state, WJB_END_ARRAY, NULL);
352}
353
354/*
355 * PLyNumber_ToJsonbValue(PyObject *obj)
356 *
357 * Transform python number to JsonbValue.
358 */
359static JsonbValue *
360PLyNumber_ToJsonbValue(PyObject *obj, JsonbValue *jbvNum)
361{
362 Numeric num;
363 char *str = PLyObject_AsString(obj);
364
365 PG_TRY();
366 {
367 Datum numd;
368
372 Int32GetDatum(-1));
373 num = DatumGetNumeric(numd);
374 }
375 PG_CATCH();
376 {
378 (errcode(ERRCODE_DATATYPE_MISMATCH),
379 errmsg("could not convert value \"%s\" to jsonb", str)));
380 }
381 PG_END_TRY();
382
383 pfree(str);
384
385 /*
386 * jsonb doesn't allow NaN or infinity (per JSON specification), so we
387 * have to reject those here explicitly.
388 */
389 if (numeric_is_nan(num))
391 (errcode(ERRCODE_NUMERIC_VALUE_OUT_OF_RANGE),
392 errmsg("cannot convert NaN to jsonb")));
393 if (numeric_is_inf(num))
395 (errcode(ERRCODE_NUMERIC_VALUE_OUT_OF_RANGE),
396 errmsg("cannot convert infinity to jsonb")));
397
398 jbvNum->type = jbvNumeric;
399 jbvNum->val.numeric = num;
400
401 return jbvNum;
402}
403
404/*
405 * PLyObject_ToJsonbValue(PyObject *obj)
406 *
407 * Transform python object to JsonbValue.
408 */
409static JsonbValue *
410PLyObject_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state, bool is_elem)
411{
412 JsonbValue *out;
413
414 if (!PyUnicode_Check(obj))
415 {
416 if (PySequence_Check(obj))
417 return PLySequence_ToJsonbValue(obj, jsonb_state);
418 else if (PyMapping_Check(obj))
419 return PLyMapping_ToJsonbValue(obj, jsonb_state);
420 }
421
422 out = palloc(sizeof(JsonbValue));
423
424 if (obj == Py_None)
425 out->type = jbvNull;
426 else if (PyUnicode_Check(obj))
427 PLyUnicode_ToJsonbValue(obj, out);
428
429 /*
430 * PyNumber_Check() returns true for booleans, so boolean check should
431 * come first.
432 */
433 else if (PyBool_Check(obj))
434 {
435 out->type = jbvBool;
436 out->val.boolean = (obj == Py_True);
437 }
438 else if (PyNumber_Check(obj))
439 out = PLyNumber_ToJsonbValue(obj, out);
440 else
442 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
443 errmsg("Python type \"%s\" cannot be transformed to jsonb",
444 PLyObject_AsString((PyObject *) obj->ob_type))));
445
446 /* Push result into 'jsonb_state' unless it is raw scalar value. */
447 return (*jsonb_state ?
448 pushJsonbValue(jsonb_state, is_elem ? WJB_ELEM : WJB_VALUE, out) :
449 out);
450}
451
452/*
453 * plpython_to_jsonb
454 *
455 * Transform python object to Jsonb datum
456 */
458Datum
460{
461 PyObject *obj;
462 JsonbValue *out;
463 JsonbParseState *jsonb_state = NULL;
464
465 obj = (PyObject *) PG_GETARG_POINTER(0);
466 out = PLyObject_ToJsonbValue(obj, &jsonb_state, true);
468}
469
470/*
471 * jsonb_to_plpython
472 *
473 * Transform Jsonb datum to PyObject and return it as internal.
474 */
476Datum
478{
479 PyObject *result;
480 Jsonb *in = PG_GETARG_JSONB_P(0);
481
482 /*
483 * Initialize pointer to Decimal constructor. First we try "cdecimal", C
484 * version of decimal library. In case of failure we use slower "decimal"
485 * module.
486 */
488 {
489 PyObject *decimal_module = PyImport_ImportModule("cdecimal");
490
491 if (!decimal_module)
492 {
493 PyErr_Clear();
494 decimal_module = PyImport_ImportModule("decimal");
495 }
496 Assert(decimal_module);
497 decimal_constructor = PyObject_GetAttrString(decimal_module, "Decimal");
498 }
499
500 result = PLyObject_FromJsonbContainer(&in->root);
501 if (!result)
502 PLy_elog(ERROR, "transformation from jsonb to Python failed");
503
504 return PointerGetDatum(result);
505}
Datum numeric_out(PG_FUNCTION_ARGS)
Definition: numeric.c:816
Datum numeric_in(PG_FUNCTION_ARGS)
Definition: numeric.c:637
bool numeric_is_nan(Numeric num)
Definition: numeric.c:851
bool numeric_is_inf(Numeric num)
Definition: numeric.c:862
#define AssertVariableIsOfType(varname, typename)
Definition: c.h:952
void * load_external_function(const char *filename, const char *funcname, bool signalNotFound, void **filehandle)
Definition: dfmgr.c:95
int errcode(int sqlerrcode)
Definition: elog.c:854
int errmsg(const char *fmt,...)
Definition: elog.c:1071
#define PG_RE_THROW()
Definition: elog.h:404
#define PG_TRY(...)
Definition: elog.h:371
#define PG_END_TRY(...)
Definition: elog.h:396
#define ERROR
Definition: elog.h:39
#define PG_CATCH(...)
Definition: elog.h:381
#define elog(elevel,...)
Definition: elog.h:225
#define PG_FINALLY(...)
Definition: elog.h:388
#define ereport(elevel,...)
Definition: elog.h:149
#define PG_GETARG_POINTER(n)
Definition: fmgr.h:276
#define DirectFunctionCall1(func, arg1)
Definition: fmgr.h:682
#define DirectFunctionCall3(func, arg1, arg2, arg3)
Definition: fmgr.h:686
#define PG_RETURN_POINTER(x)
Definition: fmgr.h:361
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193
Assert(PointerIsAligned(start, uint64))
const char * str
long val
Definition: informix.c:689
static struct @165 value
int i
Definition: isn.c:77
@ jbvNumeric
Definition: jsonb.h:230
@ jbvBool
Definition: jsonb.h:231
@ jbvBinary
Definition: jsonb.h:236
@ jbvNull
Definition: jsonb.h:228
@ jbvString
Definition: jsonb.h:229
#define PG_GETARG_JSONB_P(x)
Definition: jsonb.h:391
JsonbIteratorToken
Definition: jsonb.h:21
@ WJB_KEY
Definition: jsonb.h:23
@ WJB_DONE
Definition: jsonb.h:22
@ WJB_END_ARRAY
Definition: jsonb.h:27
@ WJB_VALUE
Definition: jsonb.h:24
@ WJB_END_OBJECT
Definition: jsonb.h:29
@ WJB_ELEM
Definition: jsonb.h:25
@ WJB_BEGIN_OBJECT
Definition: jsonb.h:28
@ WJB_BEGIN_ARRAY
Definition: jsonb.h:26
static JsonbValue * PLyObject_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state, bool is_elem)
static JsonbValue * PLyMapping_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state)
#define PLy_elog
#define PLyUnicode_FromStringAndSize
void _PG_init(void)
PG_MODULE_MAGIC_EXT(.name="jsonb_plpython",.version=PG_VERSION)
static PLy_elog_impl_t PLy_elog_impl_p
static JsonbValue * PLyNumber_ToJsonbValue(PyObject *obj, JsonbValue *jbvNum)
PyObject *(* PLyUnicode_FromStringAndSize_t)(const char *s, Py_ssize_t size)
Datum plpython_to_jsonb(PG_FUNCTION_ARGS)
void(* PLy_elog_impl_t)(int elevel, const char *fmt,...)
static PyObject * PLyObject_FromJsonbValue(JsonbValue *jsonbValue)
PG_FUNCTION_INFO_V1(plpython_to_jsonb)
static PLyObject_AsString_t PLyObject_AsString_p
char *(* PLyObject_AsString_t)(PyObject *plrv)
static PyObject * decimal_constructor
Datum jsonb_to_plpython(PG_FUNCTION_ARGS)
static PLyUnicode_FromStringAndSize_t PLyUnicode_FromStringAndSize_p
static void PLyUnicode_ToJsonbValue(PyObject *obj, JsonbValue *jbvElem)
static PyObject * PLyObject_FromJsonbContainer(JsonbContainer *jsonb)
#define PLyObject_AsString
static JsonbValue * PLySequence_ToJsonbValue(PyObject *obj, JsonbParseState **jsonb_state)
static PyObject * PLyUnicode_FromJsonbValue(JsonbValue *jbv)
JsonbValue * pushJsonbValue(JsonbParseState **pstate, JsonbIteratorToken seq, JsonbValue *jbval)
Definition: jsonb_util.c:573
JsonbIterator * JsonbIteratorInit(JsonbContainer *container)
Definition: jsonb_util.c:824
JsonbIteratorToken JsonbIteratorNext(JsonbIterator **it, JsonbValue *val, bool skipNested)
Definition: jsonb_util.c:860
Jsonb * JsonbValueToJsonb(JsonbValue *val)
Definition: jsonb_util.c:92
void pfree(void *pointer)
Definition: mcxt.c:2150
void * palloc(Size size)
Definition: mcxt.c:1943
static Numeric DatumGetNumeric(Datum X)
Definition: numeric.h:61
static Datum NumericGetDatum(Numeric X)
Definition: numeric.h:73
void PLy_elog_impl(int elevel, const char *fmt,...)
Definition: plpy_elog.c:43
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:327
uintptr_t Datum
Definition: postgres.h:69
static Datum ObjectIdGetDatum(Oid X)
Definition: postgres.h:257
static char * DatumGetCString(Datum X)
Definition: postgres.h:340
static Datum CStringGetDatum(const char *X)
Definition: postgres.h:355
static Datum Int32GetDatum(int32 X)
Definition: postgres.h:217
#define InvalidOid
Definition: postgres_ext.h:35
enum jbvType type
Definition: jsonb.h:255
char * val
Definition: jsonb.h:264
Definition: jsonb.h:213
JsonbContainer root
Definition: jsonb.h:215
static ItemArray items
Definition: test_tidstore.c:48
const char * name