Line data Source code
1 : /*
2 : * Python procedure manipulation for plpython
3 : *
4 : * src/pl/plpython/plpy_procedure.c
5 : */
6 :
7 : #include "postgres.h"
8 :
9 : #include "access/htup_details.h"
10 : #include "access/transam.h"
11 : #include "funcapi.h"
12 : #include "catalog/pg_proc.h"
13 : #include "catalog/pg_type.h"
14 : #include "plpy_elog.h"
15 : #include "plpy_main.h"
16 : #include "plpy_procedure.h"
17 : #include "plpython.h"
18 : #include "utils/builtins.h"
19 : #include "utils/hsearch.h"
20 : #include "utils/inval.h"
21 : #include "utils/lsyscache.h"
22 : #include "utils/memutils.h"
23 : #include "utils/syscache.h"
24 :
25 : static HTAB *PLy_procedure_cache = NULL;
26 :
27 : static PLyProcedure *PLy_procedure_create(HeapTuple procTup, Oid fn_oid, bool is_trigger);
28 : static bool PLy_procedure_valid(PLyProcedure *proc, HeapTuple procTup);
29 : static char *PLy_procedure_munge_source(const char *name, const char *src);
30 :
31 :
32 : void
33 46 : init_procedure_caches(void)
34 : {
35 : HASHCTL hash_ctl;
36 :
37 46 : hash_ctl.keysize = sizeof(PLyProcedureKey);
38 46 : hash_ctl.entrysize = sizeof(PLyProcedureEntry);
39 46 : PLy_procedure_cache = hash_create("PL/Python procedures", 32, &hash_ctl,
40 : HASH_ELEM | HASH_BLOBS);
41 46 : }
42 :
43 : /*
44 : * PLy_procedure_name: get the name of the specified procedure.
45 : *
46 : * NB: this returns the SQL name, not the internal Python procedure name
47 : */
48 : char *
49 1034 : PLy_procedure_name(PLyProcedure *proc)
50 : {
51 1034 : if (proc == NULL)
52 0 : return "<unknown procedure>";
53 1034 : return proc->proname;
54 : }
55 :
56 : /*
57 : * PLy_procedure_get: returns a cached PLyProcedure, or creates, stores and
58 : * returns a new PLyProcedure.
59 : *
60 : * fn_oid is the OID of the function requested
61 : * fn_rel is InvalidOid or the relation this function triggers on
62 : * is_trigger denotes whether the function is a trigger function
63 : *
64 : * The reason that both fn_rel and is_trigger need to be passed is that when
65 : * trigger functions get validated we don't know which relation(s) they'll
66 : * be used with, so no sensible fn_rel can be passed.
67 : */
68 : PLyProcedure *
69 1848 : PLy_procedure_get(Oid fn_oid, Oid fn_rel, bool is_trigger)
70 : {
71 1848 : bool use_cache = !(is_trigger && fn_rel == InvalidOid);
72 : HeapTuple procTup;
73 : PLyProcedureKey key;
74 1848 : PLyProcedureEntry *volatile entry = NULL;
75 1848 : PLyProcedure *volatile proc = NULL;
76 1848 : bool found = false;
77 :
78 1848 : procTup = SearchSysCache1(PROCOID, ObjectIdGetDatum(fn_oid));
79 1848 : if (!HeapTupleIsValid(procTup))
80 0 : elog(ERROR, "cache lookup failed for function %u", fn_oid);
81 :
82 : /*
83 : * Look for the function in the cache, unless we don't have the necessary
84 : * information (e.g. during validation). In that case we just don't cache
85 : * anything.
86 : */
87 1848 : if (use_cache)
88 : {
89 1802 : key.fn_oid = fn_oid;
90 1802 : key.fn_rel = fn_rel;
91 1802 : entry = hash_search(PLy_procedure_cache, &key, HASH_ENTER, &found);
92 1802 : proc = entry->proc;
93 : }
94 :
95 1848 : PG_TRY();
96 : {
97 1848 : if (!found)
98 : {
99 : /* Haven't found it, create a new procedure */
100 538 : proc = PLy_procedure_create(procTup, fn_oid, is_trigger);
101 530 : if (use_cache)
102 484 : entry->proc = proc;
103 : }
104 1310 : else if (!PLy_procedure_valid(proc, procTup))
105 : {
106 : /* Found it, but it's invalid, free and reuse the cache entry */
107 10 : entry->proc = NULL;
108 10 : if (proc)
109 10 : PLy_procedure_delete(proc);
110 10 : proc = PLy_procedure_create(procTup, fn_oid, is_trigger);
111 10 : entry->proc = proc;
112 : }
113 : /* Found it and it's valid, it's fine to use it */
114 : }
115 8 : PG_CATCH();
116 : {
117 : /* Do not leave an uninitialized entry in the cache */
118 8 : if (use_cache)
119 8 : hash_search(PLy_procedure_cache, &key, HASH_REMOVE, NULL);
120 8 : PG_RE_THROW();
121 : }
122 1840 : PG_END_TRY();
123 :
124 1840 : ReleaseSysCache(procTup);
125 :
126 1840 : return proc;
127 : }
128 :
129 : /*
130 : * Create a new PLyProcedure structure
131 : */
132 : static PLyProcedure *
133 548 : PLy_procedure_create(HeapTuple procTup, Oid fn_oid, bool is_trigger)
134 : {
135 : char procName[NAMEDATALEN + 256];
136 : Form_pg_proc procStruct;
137 : PLyProcedure *volatile proc;
138 : MemoryContext cxt;
139 : MemoryContext oldcxt;
140 : int rv;
141 : char *ptr;
142 :
143 548 : procStruct = (Form_pg_proc) GETSTRUCT(procTup);
144 1096 : rv = snprintf(procName, sizeof(procName),
145 : "__plpython_procedure_%s_%u",
146 548 : NameStr(procStruct->proname),
147 : fn_oid);
148 548 : if (rv >= sizeof(procName) || rv < 0)
149 0 : elog(ERROR, "procedure name would overrun buffer");
150 :
151 : /* Replace any not-legal-in-Python-names characters with '_' */
152 25686 : for (ptr = procName; *ptr; ptr++)
153 : {
154 25138 : if (!((*ptr >= 'A' && *ptr <= 'Z') ||
155 25136 : (*ptr >= 'a' && *ptr <= 'z') ||
156 6734 : (*ptr >= '0' && *ptr <= '9')))
157 3792 : *ptr = '_';
158 : }
159 :
160 : /* Create long-lived context that all procedure info will live in */
161 548 : cxt = AllocSetContextCreate(TopMemoryContext,
162 : "PL/Python function",
163 : ALLOCSET_DEFAULT_SIZES);
164 :
165 548 : oldcxt = MemoryContextSwitchTo(cxt);
166 :
167 548 : proc = (PLyProcedure *) palloc0(sizeof(PLyProcedure));
168 548 : proc->mcxt = cxt;
169 :
170 548 : PG_TRY();
171 : {
172 : Datum protrftypes_datum;
173 : Datum prosrcdatum;
174 : bool isnull;
175 : char *procSource;
176 : int i;
177 :
178 548 : proc->proname = pstrdup(NameStr(procStruct->proname));
179 548 : MemoryContextSetIdentifier(cxt, proc->proname);
180 548 : proc->pyname = pstrdup(procName);
181 548 : proc->fn_xmin = HeapTupleHeaderGetRawXmin(procTup->t_data);
182 548 : proc->fn_tid = procTup->t_self;
183 548 : proc->fn_readonly = (procStruct->provolatile != PROVOLATILE_VOLATILE);
184 548 : proc->is_setof = procStruct->proretset;
185 548 : proc->is_procedure = (procStruct->prokind == PROKIND_PROCEDURE);
186 548 : proc->src = NULL;
187 548 : proc->argnames = NULL;
188 548 : proc->args = NULL;
189 548 : proc->nargs = 0;
190 548 : proc->langid = procStruct->prolang;
191 548 : protrftypes_datum = SysCacheGetAttr(PROCOID, procTup,
192 : Anum_pg_proc_protrftypes,
193 : &isnull);
194 548 : proc->trftypes = isnull ? NIL : oid_array_to_list(protrftypes_datum);
195 548 : proc->code = NULL;
196 548 : proc->statics = NULL;
197 548 : proc->globals = NULL;
198 548 : proc->calldepth = 0;
199 548 : proc->argstack = NULL;
200 :
201 : /*
202 : * get information required for output conversion of the return value,
203 : * but only if this isn't a trigger.
204 : */
205 548 : if (!is_trigger)
206 : {
207 452 : Oid rettype = procStruct->prorettype;
208 : HeapTuple rvTypeTup;
209 : Form_pg_type rvTypeStruct;
210 :
211 452 : rvTypeTup = SearchSysCache1(TYPEOID, ObjectIdGetDatum(rettype));
212 452 : if (!HeapTupleIsValid(rvTypeTup))
213 0 : elog(ERROR, "cache lookup failed for type %u", rettype);
214 452 : rvTypeStruct = (Form_pg_type) GETSTRUCT(rvTypeTup);
215 :
216 : /* Disallow pseudotype result, except for void or record */
217 452 : if (rvTypeStruct->typtype == TYPTYPE_PSEUDO)
218 : {
219 102 : if (rettype == VOIDOID ||
220 : rettype == RECORDOID)
221 : /* okay */ ;
222 2 : else if (rettype == TRIGGEROID || rettype == EVENT_TRIGGEROID)
223 2 : ereport(ERROR,
224 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
225 : errmsg("trigger functions can only be called as triggers")));
226 : else
227 0 : ereport(ERROR,
228 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
229 : errmsg("PL/Python functions cannot return type %s",
230 : format_type_be(rettype))));
231 : }
232 :
233 : /* set up output function for procedure result */
234 450 : PLy_output_setup_func(&proc->result, proc->mcxt,
235 : rettype, -1, proc);
236 :
237 450 : ReleaseSysCache(rvTypeTup);
238 : }
239 : else
240 : {
241 : /*
242 : * In a trigger function, we use proc->result and proc->result_in
243 : * for converting tuples, but we don't yet have enough info to set
244 : * them up. PLy_exec_trigger will deal with it.
245 : */
246 96 : proc->result.typoid = InvalidOid;
247 96 : proc->result_in.typoid = InvalidOid;
248 : }
249 :
250 : /*
251 : * Now get information required for input conversion of the
252 : * procedure's arguments. Note that we ignore output arguments here.
253 : * If the function returns record, those I/O functions will be set up
254 : * when the function is first called.
255 : */
256 546 : if (procStruct->pronargs)
257 : {
258 : Oid *types;
259 : char **names,
260 : *modes;
261 : int pos,
262 : total;
263 :
264 : /* extract argument type info from the pg_proc tuple */
265 210 : total = get_func_arg_info(procTup, &types, &names, &modes);
266 :
267 : /* count number of in+inout args into proc->nargs */
268 210 : if (modes == NULL)
269 188 : proc->nargs = total;
270 : else
271 : {
272 : /* proc->nargs was initialized to 0 above */
273 82 : for (i = 0; i < total; i++)
274 : {
275 60 : if (modes[i] != PROARGMODE_OUT &&
276 36 : modes[i] != PROARGMODE_TABLE)
277 36 : (proc->nargs)++;
278 : }
279 : }
280 :
281 : /* Allocate arrays for per-input-argument data */
282 210 : proc->argnames = (char **) palloc0(sizeof(char *) * proc->nargs);
283 210 : proc->args = (PLyDatumToOb *) palloc0(sizeof(PLyDatumToOb) * proc->nargs);
284 :
285 544 : for (i = pos = 0; i < total; i++)
286 : {
287 : HeapTuple argTypeTup;
288 : Form_pg_type argTypeStruct;
289 :
290 334 : if (modes &&
291 60 : (modes[i] == PROARGMODE_OUT ||
292 36 : modes[i] == PROARGMODE_TABLE))
293 24 : continue; /* skip OUT arguments */
294 :
295 : Assert(types[i] == procStruct->proargtypes.values[pos]);
296 :
297 310 : argTypeTup = SearchSysCache1(TYPEOID,
298 310 : ObjectIdGetDatum(types[i]));
299 310 : if (!HeapTupleIsValid(argTypeTup))
300 0 : elog(ERROR, "cache lookup failed for type %u", types[i]);
301 310 : argTypeStruct = (Form_pg_type) GETSTRUCT(argTypeTup);
302 :
303 : /* disallow pseudotype arguments */
304 310 : if (argTypeStruct->typtype == TYPTYPE_PSEUDO)
305 0 : ereport(ERROR,
306 : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
307 : errmsg("PL/Python functions cannot accept type %s",
308 : format_type_be(types[i]))));
309 :
310 : /* set up I/O function info */
311 310 : PLy_input_setup_func(&proc->args[pos], proc->mcxt,
312 310 : types[i], -1, /* typmod not known */
313 : proc);
314 :
315 : /* get argument name */
316 310 : proc->argnames[pos] = names ? pstrdup(names[i]) : NULL;
317 :
318 310 : ReleaseSysCache(argTypeTup);
319 :
320 310 : pos++;
321 : }
322 : }
323 :
324 : /*
325 : * get the text of the function.
326 : */
327 546 : prosrcdatum = SysCacheGetAttrNotNull(PROCOID, procTup,
328 : Anum_pg_proc_prosrc);
329 546 : procSource = TextDatumGetCString(prosrcdatum);
330 :
331 546 : PLy_procedure_compile(proc, procSource);
332 :
333 540 : pfree(procSource);
334 : }
335 8 : PG_CATCH();
336 : {
337 8 : MemoryContextSwitchTo(oldcxt);
338 8 : PLy_procedure_delete(proc);
339 8 : PG_RE_THROW();
340 : }
341 540 : PG_END_TRY();
342 :
343 540 : MemoryContextSwitchTo(oldcxt);
344 540 : return proc;
345 : }
346 :
347 : /*
348 : * Insert the procedure into the Python interpreter
349 : */
350 : void
351 588 : PLy_procedure_compile(PLyProcedure *proc, const char *src)
352 : {
353 588 : PyObject *crv = NULL;
354 : char *msrc;
355 :
356 588 : proc->globals = PyDict_Copy(PLy_interp_globals);
357 :
358 : /*
359 : * SD is private preserved data between calls. GD is global data shared by
360 : * all functions
361 : */
362 588 : proc->statics = PyDict_New();
363 588 : if (!proc->statics)
364 0 : PLy_elog(ERROR, NULL);
365 588 : PyDict_SetItemString(proc->globals, "SD", proc->statics);
366 :
367 : /*
368 : * insert the function code into the interpreter
369 : */
370 588 : msrc = PLy_procedure_munge_source(proc->pyname, src);
371 : /* Save the mangled source for later inclusion in tracebacks */
372 588 : proc->src = MemoryContextStrdup(proc->mcxt, msrc);
373 588 : crv = PyRun_String(msrc, Py_file_input, proc->globals, NULL);
374 588 : pfree(msrc);
375 :
376 588 : if (crv != NULL)
377 : {
378 : int clen;
379 : char call[NAMEDATALEN + 256];
380 :
381 582 : Py_DECREF(crv);
382 :
383 : /*
384 : * compile a call to the function
385 : */
386 582 : clen = snprintf(call, sizeof(call), "%s()", proc->pyname);
387 582 : if (clen < 0 || clen >= sizeof(call))
388 0 : elog(ERROR, "string would overflow buffer");
389 582 : proc->code = Py_CompileString(call, "<string>", Py_eval_input);
390 582 : if (proc->code != NULL)
391 582 : return;
392 : }
393 :
394 6 : if (proc->proname)
395 6 : PLy_elog(ERROR, "could not compile PL/Python function \"%s\"",
396 : proc->proname);
397 : else
398 0 : PLy_elog(ERROR, "could not compile anonymous PL/Python code block");
399 : }
400 :
401 : void
402 60 : PLy_procedure_delete(PLyProcedure *proc)
403 : {
404 60 : Py_XDECREF(proc->code);
405 60 : Py_XDECREF(proc->statics);
406 60 : Py_XDECREF(proc->globals);
407 60 : MemoryContextDelete(proc->mcxt);
408 60 : }
409 :
410 : /*
411 : * Decide whether a cached PLyProcedure struct is still valid
412 : */
413 : static bool
414 1310 : PLy_procedure_valid(PLyProcedure *proc, HeapTuple procTup)
415 : {
416 1310 : if (proc == NULL)
417 0 : return false;
418 :
419 : /* If the pg_proc tuple has changed, it's not valid */
420 2610 : if (!(proc->fn_xmin == HeapTupleHeaderGetRawXmin(procTup->t_data) &&
421 1300 : ItemPointerEquals(&proc->fn_tid, &procTup->t_self)))
422 10 : return false;
423 :
424 1300 : return true;
425 : }
426 :
427 : static char *
428 588 : PLy_procedure_munge_source(const char *name, const char *src)
429 : {
430 : char *mrc,
431 : *mp;
432 : const char *sp;
433 : size_t mlen;
434 : int plen;
435 :
436 : /*
437 : * room for function source and the def statement
438 : */
439 588 : mlen = (strlen(src) * 2) + strlen(name) + 16;
440 :
441 588 : mrc = palloc(mlen);
442 588 : plen = snprintf(mrc, mlen, "def %s():\n\t", name);
443 : Assert(plen >= 0 && plen < mlen);
444 :
445 588 : sp = src;
446 588 : mp = mrc + plen;
447 :
448 63132 : while (*sp != '\0')
449 : {
450 62544 : if (*sp == '\r' && *(sp + 1) == '\n')
451 6 : sp++;
452 :
453 62544 : if (*sp == '\n' || *sp == '\r')
454 : {
455 2664 : *mp++ = '\n';
456 2664 : *mp++ = '\t';
457 2664 : sp++;
458 : }
459 : else
460 59880 : *mp++ = *sp++;
461 : }
462 588 : *mp++ = '\n';
463 588 : *mp++ = '\n';
464 588 : *mp = '\0';
465 :
466 588 : if (mp > (mrc + mlen))
467 0 : elog(FATAL, "buffer overrun in PLy_procedure_munge_source");
468 :
469 588 : return mrc;
470 : }
|