NotificationsYou must be signed in to change notification settings
Fork6
Star31

Commit74a1a36

committed

Fix JSON error reporting for many cases of erroneous string values.

The majority of error exit cases in json_lex_string() failed to set lex->token_terminator, causing problems for the error context reporting code: it would see token_terminator less than token_start and do something more or less nuts. In v14 and up the end result could be as bad as a crash in report_json_context(). Older versions accidentally avoided that fate; but all versions produce error context lines that are far less useful than intended, because they'd stop at the end of the prior token instead of continuing to where the actually-bad input is.

To fix, invent some macros that make it less notationally painful to do the right thing. Also add documentation about what the function is actually required to do; and in >= v14, add an assertion in report_json_context about token_terminator being sufficiently far advanced.

Per report from Nikolay Shaplov. Back-patch to all supported versions.

Discussion: https://postgr.es/m/7332649.x5DLKWyVIX@thinkpad-pgpro

1 parent5fd61bd commit74a1a36Copy full SHA for 74a1a36

File tree

4 files changed

+72

-54

lines changed

src
- backend/utils/adt
  - jsonfuncs.c
- common
  - jsonapi.c
- test/regress/expected
  - json_encoding.out
  - json_encoding_1.out

4 files changed

+72

-54

lines changed

`‎src/backend/utils/adt/jsonfuncs.c‎`

Lines changed: 1 addition & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -656,6 +656,7 @@ report_json_context(JsonLexContext *lex)`
`656`	`656`	`line_start=lex->line_start;`
`657`	`657`	`context_start=line_start;`
`658`	`658`	`context_end=lex->token_terminator;`
	`659`	`+Assert(context_end >=context_start);`
`659`	`660`
`660`	`661`	`/* Advance until we are close enough to context_end */`
`661`	`662`	`while (context_end-context_start >=50)`

`‎src/common/jsonapi.c‎`

Lines changed: 47 additions & 30 deletions

Original file line number	Diff line number	Diff line change
`@@ -667,6 +667,14 @@ json_lex(JsonLexContext *lex)`
`667`	`667`
`668`	`668`	`/*`
`669`	`669`	`* The next token in the input stream is known to be a string; lex it.`
	`670`	`+ *`
	`671`	`+ * If lex->strval isn't NULL, fill it with the decoded string.`
	`672`	`+ * Set lex->token_terminator to the end of the decoded input, and in`
	`673`	`+ * success cases, transfer its previous value to lex->prev_token_terminator.`
	`674`	`+ * Return JSON_SUCCESS or an error code.`
	`675`	`+ *`
	`676`	`+ * Note: be careful that all error exits advance lex->token_terminator`
	`677`	`+ * to the point after the character we detected the error on.`
`670`	`678`	`*/`
`671`	`679`	`staticinlineJsonParseErrorType`
`672`	`680`	`json_lex_string(JsonLexContext*lex)`
`@@ -675,6 +683,19 @@ json_lex_string(JsonLexContext *lex)`
`675`	`683`	`intlen;`
`676`	`684`	`inthi_surrogate=-1;`
`677`	`685`
	`686`	`+/* Convenience macros for error exits */`
	`687`	`+#defineFAIL_AT_CHAR_START(code) \`
	`688`	`+do { \`
	`689`	`+lex->token_terminator = s; \`
	`690`	`+return code; \`
	`691`	`+} while (0)`
	`692`	`+#defineFAIL_AT_CHAR_END(code) \`
	`693`	`+do { \`
	`694`	`+lex->token_terminator = \`
	`695`	`+s + pg_encoding_mblen_bounded(lex->input_encoding, s); \`
	`696`	`+return code; \`
	`697`	`+} while (0)`
	`698`	`+`
`678`	`699`	`if (lex->strval!=NULL)`
`679`	`700`	`resetStringInfo(lex->strval);`
`680`	`701`
`@@ -687,29 +708,22 @@ json_lex_string(JsonLexContext *lex)`
`687`	`708`	`len++;`
`688`	`709`	`/* Premature end of the string. */`
`689`	`710`	`if (len >=lex->input_length)`
`690`		`-{`
`691`		`-lex->token_terminator=s;`
`692`		`-returnJSON_INVALID_TOKEN;`
`693`		`-}`
	`711`	`+FAIL_AT_CHAR_START(JSON_INVALID_TOKEN);`
`694`	`712`	`elseif (*s=='"')`
`695`	`713`	`break;`
`696`	`714`	`elseif ((unsignedchar)*s<32)`
`697`	`715`	`{`
`698`	`716`	`/* Per RFC4627, these characters MUST be escaped. */`
`699`	`717`	`/* Since *s isn't printable, exclude it from the context string */`
`700`		`-lex->token_terminator=s;`
`701`		`-returnJSON_ESCAPING_REQUIRED;`
	`718`	`+FAIL_AT_CHAR_START(JSON_ESCAPING_REQUIRED);`
`702`	`719`	`}`
`703`	`720`	`elseif (*s=='\\')`
`704`	`721`	`{`
`705`	`722`	`/* OK, we have an escape character. */`
`706`	`723`	`s++;`
`707`	`724`	`len++;`
`708`	`725`	`if (len >=lex->input_length)`
`709`		`-{`
`710`		`-lex->token_terminator=s;`
`711`		`-returnJSON_INVALID_TOKEN;`
`712`		`-}`
	`726`	`+FAIL_AT_CHAR_START(JSON_INVALID_TOKEN);`
`713`	`727`	`elseif (*s=='u')`
`714`	`728`	`{`
`715`	`729`	`inti;`
`@@ -720,21 +734,15 @@ json_lex_string(JsonLexContext *lex)`
`720`	`734`	`s++;`
`721`	`735`	`len++;`
`722`	`736`	`if (len >=lex->input_length)`
`723`		`-{`
`724`		`-lex->token_terminator=s;`
`725`		`-returnJSON_INVALID_TOKEN;`
`726`		`-}`
	`737`	`+FAIL_AT_CHAR_START(JSON_INVALID_TOKEN);`
`727`	`738`	`elseif (*s >='0'&&*s <='9')`
`728`	`739`	`ch= (ch*16)+ (*s-'0');`
`729`	`740`	`elseif (*s >='a'&&*s <='f')`
`730`	`741`	`ch= (ch*16)+ (*s-'a')+10;`
`731`	`742`	`elseif (*s >='A'&&*s <='F')`
`732`	`743`	`ch= (ch*16)+ (*s-'A')+10;`
`733`	`744`	`else`
`734`		`-{`
`735`		`-lex->token_terminator=s+pg_encoding_mblen_bounded(lex->input_encoding,s);`
`736`		`-returnJSON_UNICODE_ESCAPE_FORMAT;`
`737`		`-}`
	`745`	`+FAIL_AT_CHAR_END(JSON_UNICODE_ESCAPE_FORMAT);`
`738`	`746`	`}`
`739`	`747`	`if (lex->strval!=NULL)`
`740`	`748`	`{`
`@@ -744,20 +752,20 @@ json_lex_string(JsonLexContext *lex)`
`744`	`752`	`if (is_utf16_surrogate_first(ch))`
`745`	`753`	`{`
`746`	`754`	`if (hi_surrogate!=-1)`
`747`		`-returnJSON_UNICODE_HIGH_SURROGATE;`
	`755`	`+FAIL_AT_CHAR_END(JSON_UNICODE_HIGH_SURROGATE);`
`748`	`756`	`hi_surrogate=ch;`
`749`	`757`	`continue;`
`750`	`758`	`}`
`751`	`759`	`elseif (is_utf16_surrogate_second(ch))`
`752`	`760`	`{`
`753`	`761`	`if (hi_surrogate==-1)`
`754`		`-returnJSON_UNICODE_LOW_SURROGATE;`
	`762`	`+FAIL_AT_CHAR_END(JSON_UNICODE_LOW_SURROGATE);`
`755`	`763`	`ch=surrogate_pair_to_codepoint(hi_surrogate,ch);`
`756`	`764`	`hi_surrogate=-1;`
`757`	`765`	`}`
`758`	`766`
`759`	`767`	`if (hi_surrogate!=-1)`
`760`		`-returnJSON_UNICODE_LOW_SURROGATE;`
	`768`	`+FAIL_AT_CHAR_END(JSON_UNICODE_LOW_SURROGATE);`
`761`	`769`
`762`	`770`	`/*`
`763`	`771`	`* Reject invalid cases. We can't have a value above`
`@@ -767,7 +775,7 @@ json_lex_string(JsonLexContext *lex)`
`767`	`775`	`if (ch==0)`
`768`	`776`	`{`
`769`	`777`	`/* We can't allow this, since our TEXT type doesn't */`
`770`		`-returnJSON_UNICODE_CODE_POINT_ZERO;`
	`778`	`+FAIL_AT_CHAR_END(JSON_UNICODE_CODE_POINT_ZERO);`
`771`	`779`	`}`
`772`	`780`
`773`	`781`	`/*`
`@@ -804,14 +812,14 @@ json_lex_string(JsonLexContext *lex)`
`804`	`812`	`appendStringInfoChar(lex->strval, (char)ch);`
`805`	`813`	`}`
`806`	`814`	`else`
`807`		`-returnJSON_UNICODE_HIGH_ESCAPE;`
	`815`	`+FAIL_AT_CHAR_END(JSON_UNICODE_HIGH_ESCAPE);`
`808`	`816`	`#endif/* FRONTEND */`
`809`	`817`	`}`
`810`	`818`	`}`
`811`	`819`	`elseif (lex->strval!=NULL)`
`812`	`820`	`{`
`813`	`821`	`if (hi_surrogate!=-1)`
`814`		`-returnJSON_UNICODE_LOW_SURROGATE;`
	`822`	`+FAIL_AT_CHAR_END(JSON_UNICODE_LOW_SURROGATE);`
`815`	`823`
`816`	`824`	`switch (*s)`
`817`	`825`	`{`
`@@ -836,10 +844,14 @@ json_lex_string(JsonLexContext *lex)`
`836`	`844`	`appendStringInfoChar(lex->strval,'\t');`
`837`	`845`	`break;`
`838`	`846`	`default:`
`839`		`-/* Not a valid string escape, so signal error. */`
	`847`	`+`
	`848`	`+/*`
	`849`	`+ * Not a valid string escape, so signal error. We`
	`850`	`+ * adjust token_start so that just the escape sequence`
	`851`	`+ * is reported, not the whole string.`
	`852`	`+ */`
`840`	`853`	`lex->token_start=s;`
`841`		`-lex->token_terminator=s+pg_encoding_mblen_bounded(lex->input_encoding,s);`
`842`		`-returnJSON_ESCAPING_INVALID;`
	`854`	`+FAIL_AT_CHAR_END(JSON_ESCAPING_INVALID);`
`843`	`855`	`}`
`844`	`856`	`}`
`845`	`857`	`elseif (strchr("\"\\/bfnrt",*s)==NULL)`
`@@ -852,26 +864,31 @@ json_lex_string(JsonLexContext *lex)`
`852`	`864`	`* shown it's not a performance win.`
`853`	`865`	`*/`
`854`	`866`	`lex->token_start=s;`
`855`		`-lex->token_terminator=s+pg_encoding_mblen_bounded(lex->input_encoding,s);`
`856`		`-returnJSON_ESCAPING_INVALID;`
	`867`	`+FAIL_AT_CHAR_END(JSON_ESCAPING_INVALID);`
`857`	`868`	`}`
`858`	`869`	`}`
`859`	`870`	`elseif (lex->strval!=NULL)`
`860`	`871`	`{`
`861`	`872`	`if (hi_surrogate!=-1)`
`862`		`-returnJSON_UNICODE_LOW_SURROGATE;`
	`873`	`+FAIL_AT_CHAR_END(JSON_UNICODE_LOW_SURROGATE);`
`863`	`874`
`864`	`875`	`appendStringInfoChar(lex->strval,*s);`
`865`	`876`	`}`
`866`	`877`	`}`
`867`	`878`
`868`	`879`	`if (hi_surrogate!=-1)`
	`880`	`+{`
	`881`	`+lex->token_terminator=s+1;`
`869`	`882`	`returnJSON_UNICODE_LOW_SURROGATE;`
	`883`	`+}`
`870`	`884`
`871`	`885`	`/* Hooray, we found the end of the string! */`
`872`	`886`	`lex->prev_token_terminator=lex->token_terminator;`
`873`	`887`	`lex->token_terminator=s+1;`
`874`	`888`	`returnJSON_SUCCESS;`
	`889`	`+`
	`890`	`+#undef FAIL_AT_CHAR_START`
	`891`	`+#undef FAIL_AT_CHAR_END`
`875`	`892`	`}`
`876`	`893`
`877`	`894`	`/*`

`‎src/test/regress/expected/json_encoding.out‎`

Lines changed: 12 additions & 12 deletions

Original file line number	Diff line number	Diff line change
`@@ -56,19 +56,19 @@ select json '{ "a": "\ud83d\ude04\ud83d\udc36" }' -> 'a' as correct_in_utf8;`
`56`	`56`	`select json '{ "a": "\ud83d\ud83d" }' -> 'a'; -- 2 high surrogates in a row`
`57`	`57`	`ERROR: invalid input syntax for type json`
`58`	`58`	`DETAIL: Unicode high surrogate must not follow a high surrogate.`
`59`		`-CONTEXT: JSON data, line 1: { "a":...`
	`59`	`+CONTEXT: JSON data, line 1: { "a": "\ud83d\ud83d...`
`60`	`60`	`select json '{ "a": "\ude04\ud83d" }' -> 'a'; -- surrogates in wrong order`
`61`	`61`	`ERROR: invalid input syntax for type json`
`62`	`62`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`63`		`-CONTEXT: JSON data, line 1: { "a":...`
	`63`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`64`	`64`	`select json '{ "a": "\ud83dX" }' -> 'a'; -- orphan high surrogate`
`65`	`65`	`ERROR: invalid input syntax for type json`
`66`	`66`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`67`		`-CONTEXT: JSON data, line 1: { "a":...`
	`67`	`+CONTEXT: JSON data, line 1: { "a": "\ud83dX...`
`68`	`68`	`select json '{ "a": "\ude04X" }' -> 'a'; -- orphan low surrogate`
`69`	`69`	`ERROR: invalid input syntax for type json`
`70`	`70`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`71`		`-CONTEXT: JSON data, line 1: { "a":...`
	`71`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`72`	`72`	`--handling of simple unicode escapes`
`73`	`73`	`select json '{ "a": "the Copyright \u00a9 sign" }' as correct_in_utf8;`
`74`	`74`	`correct_in_utf8`
`@@ -121,7 +121,7 @@ select json '{ "a": "dollar \\u0024 character" }' ->> 'a' as not_an_escape;`
`121`	`121`	`select json '{ "a": "null \u0000 escape" }' ->> 'a' as fails;`
`122`	`122`	`ERROR: unsupported Unicode escape sequence`
`123`	`123`	`DETAIL: \u0000 cannot be converted to text.`
`124`		`-CONTEXT: JSON data, line 1: { "a":...`
	`124`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`125`	`125`	`select json '{ "a": "null \\u0000 escape" }' ->> 'a' as not_an_escape;`
`126`	`126`	`not_an_escape`
`127`	`127`	`--------------------`
`@@ -159,7 +159,7 @@ ERROR: unsupported Unicode escape sequence`
`159`	`159`	`LINE 1: SELECT '"\u0000"'::jsonb;`
`160`	`160`	`^`
`161`	`161`	`DETAIL: \u0000 cannot be converted to text.`
`162`		`-CONTEXT: JSON data, line 1: ...`
	`162`	`+CONTEXT: JSON data, line 1:"\u0000...`
`163`	`163`	`-- use octet_length here so we don't get an odd unicode char in the`
`164`	`164`	`-- output`
`165`	`165`	`SELECT octet_length('"\uaBcD"'::jsonb::text); -- OK, uppercase and lower case both OK`
`@@ -180,25 +180,25 @@ ERROR: invalid input syntax for type json`
`180`	`180`	`LINE 1: SELECT jsonb '{ "a": "\ud83d\ud83d" }' -> 'a';`
`181`	`181`	`^`
`182`	`182`	`DETAIL: Unicode high surrogate must not follow a high surrogate.`
`183`		`-CONTEXT: JSON data, line 1: { "a":...`
	`183`	`+CONTEXT: JSON data, line 1: { "a": "\ud83d\ud83d...`
`184`	`184`	`SELECT jsonb '{ "a": "\ude04\ud83d" }' -> 'a'; -- surrogates in wrong order`
`185`	`185`	`ERROR: invalid input syntax for type json`
`186`	`186`	`LINE 1: SELECT jsonb '{ "a": "\ude04\ud83d" }' -> 'a';`
`187`	`187`	`^`
`188`	`188`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`189`		`-CONTEXT: JSON data, line 1: { "a":...`
	`189`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`190`	`190`	`SELECT jsonb '{ "a": "\ud83dX" }' -> 'a'; -- orphan high surrogate`
`191`	`191`	`ERROR: invalid input syntax for type json`
`192`	`192`	`LINE 1: SELECT jsonb '{ "a": "\ud83dX" }' -> 'a';`
`193`	`193`	`^`
`194`	`194`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`195`		`-CONTEXT: JSON data, line 1: { "a":...`
	`195`	`+CONTEXT: JSON data, line 1: { "a": "\ud83dX...`
`196`	`196`	`SELECT jsonb '{ "a": "\ude04X" }' -> 'a'; -- orphan low surrogate`
`197`	`197`	`ERROR: invalid input syntax for type json`
`198`	`198`	`LINE 1: SELECT jsonb '{ "a": "\ude04X" }' -> 'a';`
`199`	`199`	`^`
`200`	`200`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`201`		`-CONTEXT: JSON data, line 1: { "a":...`
	`201`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`202`	`202`	`-- handling of simple unicode escapes`
`203`	`203`	`SELECT jsonb '{ "a": "the Copyright \u00a9 sign" }' as correct_in_utf8;`
`204`	`204`	`correct_in_utf8`
`@@ -223,7 +223,7 @@ ERROR: unsupported Unicode escape sequence`
`223`	`223`	`LINE 1: SELECT jsonb '{ "a": "null \u0000 escape" }' as fails;`
`224`	`224`	`^`
`225`	`225`	`DETAIL: \u0000 cannot be converted to text.`
`226`		`-CONTEXT: JSON data, line 1: { "a":...`
	`226`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`227`	`227`	`SELECT jsonb '{ "a": "null \\u0000 escape" }' as not_an_escape;`
`228`	`228`	`not_an_escape`
`229`	`229`	`------------------------------`
`@@ -253,7 +253,7 @@ ERROR: unsupported Unicode escape sequence`
`253`	`253`	`LINE 1: SELECT jsonb '{ "a": "null \u0000 escape" }' ->> 'a' as fai...`
`254`	`254`	`^`
`255`	`255`	`DETAIL: \u0000 cannot be converted to text.`
`256`		`-CONTEXT: JSON data, line 1: { "a":...`
	`256`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`257`	`257`	`SELECT jsonb '{ "a": "null \\u0000 escape" }' ->> 'a' as not_an_escape;`
`258`	`258`	`not_an_escape`
`259`	`259`	`--------------------`

`‎src/test/regress/expected/json_encoding_1.out‎`

Lines changed: 12 additions & 12 deletions

Original file line number	Diff line number	Diff line change
`@@ -52,19 +52,19 @@ ERROR: conversion between UTF8 and SQL_ASCII is not supported`
`52`	`52`	`select json '{ "a": "\ud83d\ud83d" }' -> 'a'; -- 2 high surrogates in a row`
`53`	`53`	`ERROR: invalid input syntax for type json`
`54`	`54`	`DETAIL: Unicode high surrogate must not follow a high surrogate.`
`55`		`-CONTEXT: JSON data, line 1: { "a":...`
	`55`	`+CONTEXT: JSON data, line 1: { "a": "\ud83d\ud83d...`
`56`	`56`	`select json '{ "a": "\ude04\ud83d" }' -> 'a'; -- surrogates in wrong order`
`57`	`57`	`ERROR: invalid input syntax for type json`
`58`	`58`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`59`		`-CONTEXT: JSON data, line 1: { "a":...`
	`59`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`60`	`60`	`select json '{ "a": "\ud83dX" }' -> 'a'; -- orphan high surrogate`
`61`	`61`	`ERROR: invalid input syntax for type json`
`62`	`62`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`63`		`-CONTEXT: JSON data, line 1: { "a":...`
	`63`	`+CONTEXT: JSON data, line 1: { "a": "\ud83dX...`
`64`	`64`	`select json '{ "a": "\ude04X" }' -> 'a'; -- orphan low surrogate`
`65`	`65`	`ERROR: invalid input syntax for type json`
`66`	`66`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`67`		`-CONTEXT: JSON data, line 1: { "a":...`
	`67`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`68`	`68`	`--handling of simple unicode escapes`
`69`	`69`	`select json '{ "a": "the Copyright \u00a9 sign" }' as correct_in_utf8;`
`70`	`70`	`correct_in_utf8`
`@@ -113,7 +113,7 @@ select json '{ "a": "dollar \\u0024 character" }' ->> 'a' as not_an_escape;`
`113`	`113`	`select json '{ "a": "null \u0000 escape" }' ->> 'a' as fails;`
`114`	`114`	`ERROR: unsupported Unicode escape sequence`
`115`	`115`	`DETAIL: \u0000 cannot be converted to text.`
`116`		`-CONTEXT: JSON data, line 1: { "a":...`
	`116`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`117`	`117`	`select json '{ "a": "null \\u0000 escape" }' ->> 'a' as not_an_escape;`
`118`	`118`	`not_an_escape`
`119`	`119`	`--------------------`
`@@ -151,7 +151,7 @@ ERROR: unsupported Unicode escape sequence`
`151`	`151`	`LINE 1: SELECT '"\u0000"'::jsonb;`
`152`	`152`	`^`
`153`	`153`	`DETAIL: \u0000 cannot be converted to text.`
`154`		`-CONTEXT: JSON data, line 1: ...`
	`154`	`+CONTEXT: JSON data, line 1:"\u0000...`
`155`	`155`	`-- use octet_length here so we don't get an odd unicode char in the`
`156`	`156`	`-- output`
`157`	`157`	`SELECT octet_length('"\uaBcD"'::jsonb::text); -- OK, uppercase and lower case both OK`
`@@ -168,25 +168,25 @@ ERROR: invalid input syntax for type json`
`168`	`168`	`LINE 1: SELECT jsonb '{ "a": "\ud83d\ud83d" }' -> 'a';`
`169`	`169`	`^`
`170`	`170`	`DETAIL: Unicode high surrogate must not follow a high surrogate.`
`171`		`-CONTEXT: JSON data, line 1: { "a":...`
	`171`	`+CONTEXT: JSON data, line 1: { "a": "\ud83d\ud83d...`
`172`	`172`	`SELECT jsonb '{ "a": "\ude04\ud83d" }' -> 'a'; -- surrogates in wrong order`
`173`	`173`	`ERROR: invalid input syntax for type json`
`174`	`174`	`LINE 1: SELECT jsonb '{ "a": "\ude04\ud83d" }' -> 'a';`
`175`	`175`	`^`
`176`	`176`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`177`		`-CONTEXT: JSON data, line 1: { "a":...`
	`177`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`178`	`178`	`SELECT jsonb '{ "a": "\ud83dX" }' -> 'a'; -- orphan high surrogate`
`179`	`179`	`ERROR: invalid input syntax for type json`
`180`	`180`	`LINE 1: SELECT jsonb '{ "a": "\ud83dX" }' -> 'a';`
`181`	`181`	`^`
`182`	`182`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`183`		`-CONTEXT: JSON data, line 1: { "a":...`
	`183`	`+CONTEXT: JSON data, line 1: { "a": "\ud83dX...`
`184`	`184`	`SELECT jsonb '{ "a": "\ude04X" }' -> 'a'; -- orphan low surrogate`
`185`	`185`	`ERROR: invalid input syntax for type json`
`186`	`186`	`LINE 1: SELECT jsonb '{ "a": "\ude04X" }' -> 'a';`
`187`	`187`	`^`
`188`	`188`	`DETAIL: Unicode low surrogate must follow a high surrogate.`
`189`		`-CONTEXT: JSON data, line 1: { "a":...`
	`189`	`+CONTEXT: JSON data, line 1: { "a": "\ude04...`
`190`	`190`	`-- handling of simple unicode escapes`
`191`	`191`	`SELECT jsonb '{ "a": "the Copyright \u00a9 sign" }' as correct_in_utf8;`
`192`	`192`	`ERROR: conversion between UTF8 and SQL_ASCII is not supported`
`@@ -209,7 +209,7 @@ ERROR: unsupported Unicode escape sequence`
`209`	`209`	`LINE 1: SELECT jsonb '{ "a": "null \u0000 escape" }' as fails;`
`210`	`210`	`^`
`211`	`211`	`DETAIL: \u0000 cannot be converted to text.`
`212`		`-CONTEXT: JSON data, line 1: { "a":...`
	`212`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`213`	`213`	`SELECT jsonb '{ "a": "null \\u0000 escape" }' as not_an_escape;`
`214`	`214`	`not_an_escape`
`215`	`215`	`------------------------------`
`@@ -237,7 +237,7 @@ ERROR: unsupported Unicode escape sequence`
`237`	`237`	`LINE 1: SELECT jsonb '{ "a": "null \u0000 escape" }' ->> 'a' as fai...`
`238`	`238`	`^`
`239`	`239`	`DETAIL: \u0000 cannot be converted to text.`
`240`		`-CONTEXT: JSON data, line 1: { "a":...`
	`240`	`+CONTEXT: JSON data, line 1: { "a": "null \u0000...`
`241`	`241`	`SELECT jsonb '{ "a": "null \\u0000 escape" }' ->> 'a' as not_an_escape;`
`242`	`242`	`not_an_escape`
`243`	`243`	`--------------------`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit74a1a36

File tree

4 files changed

4 files changed

`‎src/backend/utils/adt/jsonfuncs.c‎`

`‎src/common/jsonapi.c‎`

`‎src/test/regress/expected/json_encoding.out‎`

`‎src/test/regress/expected/json_encoding_1.out‎`

0 commit comments