Location via proxy:   [ UP ]  
[Report a bug]   [Manage cookies]                
Skip to content

Commit b995518

Browse files
committed
Add defenses against putting expanded objects into Const nodes.
Putting a reference to an expanded-format value into a Const node would be a bad idea for a couple of reasons. It'd be possible for the supposedly immutable Const to change value, if something modified the referenced variable ... in fact, if the Const's reference were R/W, any function that has the Const as argument might itself change it at runtime. Also, because datumIsEqual() is pretty simplistic, the Const might fail to compare equal to other Consts that it should compare equal to, notably including copies of itself. This could lead to unexpected planner behavior, such as "could not find pathkey item to sort" errors or inferior plans.

I have not been able to find any way to get an expanded value into a Const within the existing core code; but Paul Ramsey was able to trigger the problem by writing a datatype input function that returns an expanded value.

The best fix seems to be to establish a rule that varlena values being placed into Const nodes should be passed through pg_detoast_datum(). That will do nothing (and cost little) in normal cases, but it will flatten expanded values and thereby avoid the above problems. Also, it will convert short-header or compressed values into canonical format, which will avoid possible unexpected lack-of-equality issues for those cases too. And it provides a last-ditch defense against putting a toasted value into a Const, which we already knew was dangerous, cf commit 2b0c86b. (In the light of this discussion, I'm no longer sure that that commit provided 100% protection against such cases, but this fix should do it.)

The test added in commit 65c3d05 to catch datatype input functions with unstable results would fail for functions that returned expanded values; but it seems a bit uncharitable to deem a result unstable just because it's expressed in expanded form, so revise the coding so that we check for bitwise equality only after applying pg_detoast_datum(). That's a sufficient condition anyway given the new rule about detoasting when forming a Const.

Back-patch to 9.5 where the expanded-object facility was added. It's possible that this should go back further; but in the absence of clear evidence that there's any live bug in older branches, I'll refrain for now.
1 parent 38710a3 commit b995518

File tree

5 files changed

+55
-31
lines changed

5 files changed

+55
-31
lines changed

src/backend/nodes/makefuncs.c

+9
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@
1717

1818
#include "catalog/pg_class.h"
1919
#include "catalog/pg_type.h"
20+
#include "fmgr.h"
2021
#include "nodes/makefuncs.h"
2122
#include "nodes/nodeFuncs.h"
2223
#include "utils/lsyscache.h"
@@ -302,6 +303,14 @@ makeConst(Oid consttype,
302303
{
303304
Const *cnst = makeNode(Const);
304305

306+
/*
307+
* If it's a varlena value, force it to be in non-expanded (non-toasted)
308+
* format; this avoids any possible dependency on external values and
309+
* improves consistency of representation, which is important for equal().
310+
*/
311+
if (!constisnull && constlen == -1)
312+
constvalue = PointerGetDatum(PG_DETOAST_DATUM(constvalue));
313+
305314
cnst->consttype = consttype;
306315
cnst->consttypmod = consttypmod;
307316
cnst->constcollid = constcollid;

src/backend/optimizer/util/clauses.c

+2-1
Original file line numberDiff line numberDiff line change
@@ -4886,7 +4886,8 @@ evaluate_expr(Expr *expr, Oid result_type, int32 result_typmod,
48864886
*
48874887
* Also, if it's varlena, forcibly detoast it. This protects us against
48884888
* storing TOAST pointers into plans that might outlive the referenced
4889-
* data.
4889+
* data. (makeConst would handle detoasting anyway, but it's worth a few
4890+
* extra lines here so that we can do the copy and detoast in one step.)
48904891
*/
48914892
if (!const_is_null)
48924893
{

src/backend/parser/parse_coerce.c

+38
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,7 @@
2626
#include "parser/parse_relation.h"
2727
#include "parser/parse_type.h"
2828
#include "utils/builtins.h"
29+
#include "utils/datum.h"
2930
#include "utils/lsyscache.h"
3031
#include "utils/syscache.h"
3132
#include "utils/typcache.h"
@@ -308,6 +309,43 @@ coerce_type(ParseState *pstate, Node *node,
308309
NULL,
309310
inputTypeMod);
310311

312+
/*
313+
* If it's a varlena value, force it to be in non-expanded
314+
* (non-toasted) format; this avoids any possible dependency on
315+
* external values and improves consistency of representation.
316+
*/
317+
if (!con->constisnull && newcon->constlen == -1)
318+
newcon->constvalue =
319+
PointerGetDatum(PG_DETOAST_DATUM(newcon->constvalue));
320+
321+
#ifdef RANDOMIZE_ALLOCATED_MEMORY
322+
323+
/*
324+
* For pass-by-reference data types, repeat the conversion to see if
325+
* the input function leaves any uninitialized bytes in the result. We
326+
* can only detect that reliably if RANDOMIZE_ALLOCATED_MEMORY is
327+
* enabled, so we don't bother testing otherwise. The reason we don't
328+
* want any instability in the input function is that comparison of
329+
* Const nodes relies on bytewise comparison of the datums, so if the
330+
* input function leaves garbage then subexpressions that should be
331+
* identical may not get recognized as such. See pgsql-hackers
332+
* discussion of 2008-04-04.
333+
*/
334+
if (!con->constisnull && !newcon->constbyval)
335+
{
336+
Datum val2;
337+
338+
val2 = stringTypeDatum(baseType,
339+
DatumGetCString(con->constvalue),
340+
inputTypeMod);
341+
if (newcon->constlen == -1)
342+
val2 = PointerGetDatum(PG_DETOAST_DATUM(val2));
343+
if (!datumIsEqual(newcon->constvalue, val2, false, newcon->constlen))
344+
elog(WARNING, "type %s has unstable input conversion for \"%s\"",
345+
typeTypeName(baseType), DatumGetCString(con->constvalue));
346+
}
347+
#endif
348+
311349
cancel_parser_errposition_callback(&pcbstate);
312350

313351
result = (Node *) newcon;

src/backend/parser/parse_type.c

+1-30
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,6 @@
2323
#include "parser/parse_type.h"
2424
#include "utils/array.h"
2525
#include "utils/builtins.h"
26-
#include "utils/datum.h"
2726
#include "utils/lsyscache.h"
2827
#include "utils/syscache.h"
2928

@@ -639,36 +638,8 @@ stringTypeDatum(Type tp, char *string, int32 atttypmod)
639638
Form_pg_type typform = (Form_pg_type) GETSTRUCT(tp);
640639
Oid typinput = typform->typinput;
641640
Oid typioparam = getTypeIOParam(tp);
642-
Datum result;
643641

644-
result = OidInputFunctionCall(typinput, string,
645-
typioparam, atttypmod);
646-
647-
#ifdef RANDOMIZE_ALLOCATED_MEMORY
648-
649-
/*
650-
* For pass-by-reference data types, repeat the conversion to see if the
651-
* input function leaves any uninitialized bytes in the result. We can
652-
* only detect that reliably if RANDOMIZE_ALLOCATED_MEMORY is enabled, so
653-
* we don't bother testing otherwise. The reason we don't want any
654-
* instability in the input function is that comparison of Const nodes
655-
* relies on bytewise comparison of the datums, so if the input function
656-
* leaves garbage then subexpressions that should be identical may not get
657-
* recognized as such. See pgsql-hackers discussion of 2008-04-04.
658-
*/
659-
if (string && !typform->typbyval)
660-
{
661-
Datum result2;
662-
663-
result2 = OidInputFunctionCall(typinput, string,
664-
typioparam, atttypmod);
665-
if (!datumIsEqual(result, result2, typform->typbyval, typform->typlen))
666-
elog(WARNING, "type %s has unstable input conversion for \"%s\"",
667-
NameStr(typform->typname), string);
668-
}
669-
#endif
670-
671-
return result;
642+
return OidInputFunctionCall(typinput, string, typioparam, atttypmod);
672643
}
673644

674645
/* given a typeid, return the type's typrelid (associated relation, if any) */

src/include/nodes/primnodes.h

+5
Original file line numberDiff line numberDiff line change
@@ -165,6 +165,11 @@ typedef struct Var
165165

166166
/*
167167
* Const
168+
*
169+
* Note: for varlena data types, we make a rule that a Const node's value
170+
* must be in non-extended form (4-byte header, no compression or external
171+
* references). This ensures that the Const node is self-contained and makes
172+
* it more likely that equal() will see logically identical values as equal.
168173
*/
169174
typedef struct Const
170175
{

0 commit comments

Comments
 (0)