Notifications: You must be signed in to change notification settings
Fork6
Star31

Commit 4e7f62b

committed

Add support for Unicode case folding.

Expand case mapping tables to include entries for case folding, which are parsed from CaseFolding.txt.

Discussion: https://postgr.es/m/a1886ddfcd8f60cb3e905c93009b646b4cfb74c5.camel%40j-davis.com

1 parent 7921927, commit 4e7f62b (Copy full SHA for 4e7f62b)

File tree

7 files changed

+3280

-3125

lines changed

src
- common
  - unicode
  - unicode_case.c
- include/common
  - unicode_case.h
  - unicode_case_table.h

7 files changed

+3280

-3125

lines changed

`‎src/common/unicode/Makefile`

Lines changed: 3 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -30,13 +30,13 @@ update-unicode: unicode_case_table.h unicode_category_table.h unicode_east_asian`
`30`	`30`	`# These files are part of the Unicode Character Database. Download`
`31`	`31`	`# them on demand. The dependency on Makefile.global is for`
`32`	`32`	`# UNICODE_VERSION.`
`33`		`-CompositionExclusions.txtDerivedCoreProperties.txtDerivedNormalizationProps.txtEastAsianWidth.txtNormalizationTest.txtPropList.txtSpecialCasing.txtUnicodeData.txt:$(top_builddir)/src/Makefile.global`
	`33`	`+CompositionExclusions.txtCaseFolding.txtDerivedCoreProperties.txtDerivedNormalizationProps.txtEastAsianWidth.txtNormalizationTest.txtPropList.txtSpecialCasing.txtUnicodeData.txt:$(top_builddir)/src/Makefile.global`
`34`	`34`	`$(DOWNLOAD) https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd/$(@F)`
`35`	`35`
`36`	`36`	`unicode_version.h: generate-unicode_version.pl`
`37`	`37`	`$(PERL)$< --version$(UNICODE_VERSION)`
`38`	`38`
`39`		`-unicode_case_table.h: generate-unicode_case_table.pl UnicodeData.txt`
	`39`	`+unicode_case_table.h: generate-unicode_case_table.plCaseFolding.txtUnicodeData.txt`
`40`	`40`	`$(PERL)$<`
`41`	`41`
`42`	`42`	`unicode_category_table.h: generate-unicode_category_table.pl DerivedCoreProperties.txt PropList.txt UnicodeData.txt`
`@@ -91,4 +91,4 @@ clean:`
`91`	`91`	`rm -f$(OBJS) case_test case_test.o category_test category_test.o norm_test norm_test.o`
`92`	`92`
`93`	`93`	`distclean: clean`
`94`		`-rm -f CompositionExclusions.txt DerivedCoreProperties.txt DerivedNormalizationProps.txt EastAsianWidth.txt NormalizationTest.txt PropList.txt SpecialCasing.txt UnicodeData.txt norm_test_table.h unicode_case_table.h unicode_category_table.h unicode_norm_table.h`
	`94`	`+rm -f CompositionExclusions.txtCaseFolding.txtDerivedCoreProperties.txt DerivedNormalizationProps.txt EastAsianWidth.txt NormalizationTest.txt PropList.txt SpecialCasing.txt UnicodeData.txt norm_test_table.h unicode_case_table.h unicode_category_table.h unicode_norm_table.h`

`‎src/common/unicode/case_test.c`

Lines changed: 27 additions & 5 deletions

Original file line number	Diff line number	Diff line change
`@@ -81,17 +81,20 @@ icu_test_simple(pg_wchar code)`
`81`	`81`	`pg_wcharlower=unicode_lowercase_simple(code);`
`82`	`82`	`pg_wchartitle=unicode_titlecase_simple(code);`
`83`	`83`	`pg_wcharupper=unicode_uppercase_simple(code);`
	`84`	`+pg_wcharfold=unicode_casefold_simple(code);`
`84`	`85`	`pg_wchariculower=u_tolower(code);`
`85`	`86`	`pg_wcharicutitle=u_totitle(code);`
`86`	`87`	`pg_wcharicuupper=u_toupper(code);`
	`88`	`+pg_wcharicufold=u_foldCase(code,U_FOLD_CASE_DEFAULT);`
`87`	`89`
`88`		`-if (lower!=iculower\|\|title!=icutitle\|\|upper!=icuupper)`
	`90`	`+if (lower!=iculower\|\|title!=icutitle\|\|upper!=icuupper\|\|`
	`91`	`+fold!=icufold)`
`89`	`92`	`{`
`90`	`93`	`printf("case_test: FAILURE for codepoint 0x%06x\n",code);`
`91`		`-printf("case_test: Postgres lower/title/upper:0x%06x/0x%06x/0x%06x\n",`
`92`		`-lower,title,upper);`
`93`		`-printf("case_test: ICU lower/title/upper:0x%06x/0x%06x/0x%06x\n",`
`94`		`-iculower,icutitle,icuupper);`
	`94`	`+printf("case_test: Postgres lower/title/upper/fold:0x%06x/0x%06x/0x%06x/0x%06x\n",`
	`95`	`+lower,title,upper,fold);`
	`96`	`+printf("case_test: ICU lower/title/upper/fold:0x%06x/0x%06x/0x%06x/0x%06x\n",`
	`97`	`+iculower,icutitle,icuupper,icufold);`
`95`	`98`	`printf("\n");`
`96`	`99`	`exit(1);`
`97`	`100`	`}`
`@@ -103,9 +106,11 @@ icu_test_full(char *str)`
`103`	`106`	`charlower[BUFSZ];`
`104`	`107`	`chartitle[BUFSZ];`
`105`	`108`	`charupper[BUFSZ];`
	`109`	`+charfold[BUFSZ];`
`106`	`110`	`charicu_lower[BUFSZ];`
`107`	`111`	`charicu_title[BUFSZ];`
`108`	`112`	`charicu_upper[BUFSZ];`
	`113`	`+charicu_fold[BUFSZ];`
`109`	`114`	`UErrorCodestatus;`
`110`	`115`	`structWordBoundaryStatewbstate= {`
`111`	`116`	`.str=str,`
`@@ -118,12 +123,15 @@ icu_test_full(char *str)`
`118`	`123`	`unicode_strlower(lower,BUFSZ,str,-1, true);`
`119`	`124`	`unicode_strtitle(title,BUFSZ,str,-1, true,initcap_wbnext,&wbstate);`
`120`	`125`	`unicode_strupper(upper,BUFSZ,str,-1, true);`
	`126`	`+unicode_strfold(fold,BUFSZ,str,-1, true);`
`121`	`127`	`status=U_ZERO_ERROR;`
`122`	`128`	`ucasemap_utf8ToLower(casemap,icu_lower,BUFSZ,str,-1,&status);`
`123`	`129`	`status=U_ZERO_ERROR;`
`124`	`130`	`ucasemap_utf8ToTitle(casemap,icu_title,BUFSZ,str,-1,&status);`
`125`	`131`	`status=U_ZERO_ERROR;`
`126`	`132`	`ucasemap_utf8ToUpper(casemap,icu_upper,BUFSZ,str,-1,&status);`
	`133`	`+status=U_ZERO_ERROR;`
	`134`	`+ucasemap_utf8FoldCase(casemap,icu_fold,BUFSZ,str,-1,&status);`
`127`	`135`
`128`	`136`	`if (strcmp(lower,icu_lower)!=0)`
`129`	`137`	`{`
`@@ -143,6 +151,12 @@ icu_test_full(char *str)`
`143`	`151`	`icu_upper);`
`144`	`152`	`exit(1);`
`145`	`153`	`}`
	`154`	`+if (strcmp(fold,icu_fold)!=0)`
	`155`	`+{`
	`156`	`+printf("case_test: str='%s' fold='%s' icu_fold='%s'\n",str,fold,`
	`157`	`+icu_fold);`
	`158`	`+exit(1);`
	`159`	`+}`
`146`	`160`	`}`
`147`	`161`
`148`	`162`	`/*`
`@@ -302,6 +316,12 @@ tfunc_upper(char dst, size_t dstsize, const char src,`
`302`	`316`	`returnunicode_strupper(dst,dstsize,src,srclen, true);`
`303`	`317`	`}`
`304`	`318`
	`319`	`+staticsize_t`
	`320`	`+tfunc_fold(chardst,size_tdstsize,constcharsrc,`
	`321`	`+ssize_tsrclen)`
	`322`	`+{`
	`323`	`+returnunicode_strfold(dst,dstsize,src,srclen, true);`
	`324`	`+}`
`305`	`325`
`306`	`326`	`staticvoid`
`307`	`327`	`test_convert_case()`
`@@ -318,10 +338,12 @@ test_convert_case()`
`318`	`338`	`test_convert(tfunc_upper,"ß","SS");`
`319`	`339`	`test_convert(tfunc_lower,"ıiIİ","ıiii\u0307");`
`320`	`340`	`test_convert(tfunc_upper,"ıiIİ","IIIİ");`
	`341`	`+test_convert(tfunc_fold,"ıiIİ","ıiii\u0307");`
`321`	`342`	`/* test final sigma */`
`322`	`343`	`test_convert(tfunc_lower,"σςΣ ΣΣΣ","σςς σσς");`
`323`	`344`	`test_convert(tfunc_lower,"σς'Σ' ΣΣ'Σ'","σς'ς' σσ'ς'");`
`324`	`345`	`test_convert(tfunc_title,"σςΣ ΣΣΣ","Σςς Σσς");`
	`346`	`+test_convert(tfunc_fold,"σςΣ ΣΣΣ","σσσ σσσ");`
`325`	`347`
`326`	`348`	`#ifdefUSE_ICU`
`327`	`349`	`icu_test_full("");`

`‎src/common/unicode/generate-unicode_case_table.pl`

Lines changed: 103 additions & 7 deletions

Original file line number	Diff line number	Diff line change
`@@ -49,7 +49,8 @@`
`49`	`49`	`$simple{$code} = {`
`50`	`50`	`Simple_Lowercase=> ($simple_lowercase \|\|$code),`
`51`	`51`	`Simple_Titlecase=> ($simple_titlecase \|\|$code),`
`52`		`-Simple_Uppercase=> ($simple_uppercase \|\|$code)`
	`52`	`+Simple_Uppercase=> ($simple_uppercase \|\|$code),`
	`53`	`+Simple_Foldcase=>$code,`
`53`	`54`	`};`
`54`	`55`	`}`
`55`	`56`	`}`
`@@ -87,6 +88,7 @@`
`87`	`88`	`my@lower =map {hex$_ } (grep /^[0-9A-F]+$/, (split /\s+/,$elts[1]));`
`88`	`89`	`my@title =map {hex$_ } (grep /^[0-9A-F]+$/, (split /\s+/,$elts[2]));`
`89`	`90`	`my@upper =map {hex$_ } (grep /^[0-9A-F]+$/, (split /\s+/,$elts[3]));`
	`91`	`+my@fold = ();`
`90`	`92`	`my@conditions =map {`
`91`	`93`	`# supporting negated conditions may require storing a`
`92`	`94`	`# mask of relevant conditions for a given rule to differentiate`
`@@ -101,6 +103,7 @@`
`101`	`103`	`push@lower,$codeif (scalar@lower == 0);`
`102`	`104`	`push@title,$codeif (scalar@title == 0);`
`103`	`105`	`push@upper,$codeif (scalar@upper == 0);`
	`106`	`+push@fold,$code;`
`104`	`107`
`105`	`108`	`# none should map to more than 3 codepoints`
`106`	`109`	`die"lowercase expansion for 0x$elts[0] exceeds maximum: '$elts[1]'"`
`@@ -114,13 +117,15 @@`
`114`	`117`	`while (scalar@upper <$MAX_CASE_EXPANSION) {push@upper, 0x000000 }`
`115`	`118`	`while (scalar@lower <$MAX_CASE_EXPANSION) {push@lower, 0x000000 }`
`116`	`119`	`while (scalar@title <$MAX_CASE_EXPANSION) {push@title, 0x000000 }`
	`120`	`+while (scalar@fold <$MAX_CASE_EXPANSION) {push@fold, 0x000000 }`
`117`	`121`
`118`	`122`	`# Characters with special mappings may not have simple mappings;`
`119`	`123`	`# ensure that an entry exists.`
`120`	`124`	`$simple{$code} \|\|= {`
`121`	`125`	`Simple_Lowercase=>$code,`
`122`	`126`	`Simple_Titlecase=>$code,`
`123`		`-Simple_Uppercase=>$code`
	`127`	`+Simple_Uppercase=>$code,`
	`128`	`+Simple_Foldcase=>$code`
`124`	`129`	`};`
`125`	`130`
`126`	`131`	`# Multiple special case rules for a single codepoint could be`
`@@ -135,11 +140,96 @@`
`135`	`140`	`Lowercase=> \@lower,`
`136`	`141`	`Titlecase=> \@title,`
`137`	`142`	`Uppercase=> \@upper,`
	`143`	`+Foldcase=> \@fold,`
`138`	`144`	`Conditions=>$cond_str`
`139`	`145`	`};`
`140`	`146`	`}`
`141`	`147`	`close$FH;`
`142`	`148`
	`149`	`+open($FH,'<',"$output_path/CaseFolding.txt")`
	`150`	`+ordie"Could not open$output_path/CaseFolding.txt:$!.";`
	`151`	`+while (my$line = <$FH>)`
	`152`	`+{`
	`153`	`+# remove comments`
	`154`	`+$line =~s/^(.?)#.$/$1/s;`
	`155`	`+`
	`156`	`+# ignore empty lines`
	`157`	`+nextunless$line =~/;/;`
	`158`	`+`
	`159`	`+my@elts =split(';',$line);`
	`160`	`+my$code =hex($elts[0]);`
	`161`	`+my$status =$elts[1] =~s/^\s+\|\s+$//rg;`
	`162`	`+`
	`163`	`+# Codepoint may map to multiple characters when folding. Split`
	`164`	`+# each mapping on whitespace and extract the hexadecimal into an`
	`165`	`+# array of codepoints.`
	`166`	`+my@fold =map {hex$_ } (grep /[0-9A-F]+/, (split /\s+/,$elts[2]));`
	`167`	`+`
	`168`	`+die"codepoint$code out of range"if$code > 0x10FFFF;`
	`169`	`+`
	`170`	`+# status 'T' unsupported; skip`
	`171`	`+nextif$statuseq'T';`
	`172`	`+`
	`173`	`+# encountered unrecognized status type`
	`174`	`+die"unsupported status type '$status'"`
	`175`	`+if$statusne'S' &&$statusne'C' &&$statusne'F';`
	`176`	`+`
	`177`	`+# initialize simple case mappings if they don't exist`
	`178`	`+$simple{$code} \|\|= {`
	`179`	`+Simple_Lowercase=>$code,`
	`180`	`+Simple_Titlecase=>$code,`
	`181`	`+Simple_Uppercase=>$code,`
	`182`	`+Simple_Foldcase=>$code`
	`183`	`+};`
	`184`	`+`
	`185`	`+if ($statuseq'S' \|\|$statuseq'C')`
	`186`	`+{`
	`187`	`+die`
	`188`	`+"Simple case folding for$code has multiple codepoints: '$line' '$elts[2]'"`
	`189`	`+ifscalar@fold != 1;`
	`190`	`+my$simple_foldcase =$fold[0];`
	`191`	`+`
	`192`	`+die"Simple_Foldcase$code out of range"`
	`193`	`+if$simple_foldcase > 0x10FFFF;`
	`194`	`+`
	`195`	`+$simple{$code}{Simple_Foldcase} =$simple_foldcase;`
	`196`	`+}`
	`197`	`+`
	`198`	`+if ($statuseq'F' \|\| ($statuseq'C' &&defined$special{$code}))`
	`199`	`+{`
	`200`	`+while (scalar@fold <$MAX_CASE_EXPANSION) {push@fold, 0x000000 }`
	`201`	`+`
	`202`	`+#initialize special case mappings if they don't exist`
	`203`	`+if (!defined$special{$code})`
	`204`	`+{`
	`205`	`+my@lower = ($simple{$code}{Simple_Lowercase});`
	`206`	`+my@title = ($simple{$code}{Simple_Titlecase});`
	`207`	`+my@upper = ($simple{$code}{Simple_Uppercase});`
	`208`	`+while (scalar@lower <$MAX_CASE_EXPANSION)`
	`209`	`+{`
	`210`	`+push@lower, 0x000000;`
	`211`	`+}`
	`212`	`+while (scalar@title <$MAX_CASE_EXPANSION)`
	`213`	`+{`
	`214`	`+push@title, 0x000000;`
	`215`	`+}`
	`216`	`+while (scalar@upper <$MAX_CASE_EXPANSION)`
	`217`	`+{`
	`218`	`+push@upper, 0x000000;`
	`219`	`+}`
	`220`	`+$special{$code} = {`
	`221`	`+Lowercase=> \@lower,`
	`222`	`+Titlecase=> \@title,`
	`223`	`+Uppercase=> \@upper,`
	`224`	`+Conditions=>'0'`
	`225`	`+};`
	`226`	`+}`
	`227`	`+`
	`228`	`+$special{$code}{Foldcase} = \@fold;`
	`229`	`+}`
	`230`	`+}`
	`231`	`+close$FH;`
	`232`	`+`
`143`	`233`	`# assign sequential array indexes to the special mappings`
`144`	`234`	`my$special_idx = 0;`
`145`	`235`	`foreachmy$code (sort {$a<=>$b } (keys%special))`
`@@ -202,6 +292,7 @@`
`202`	`292`	`CaseLower = 0,`
`203`	`293`	`CaseTitle = 1,`
`204`	`294`	`CaseUpper = 2,`
	`295`	`+CaseFold = 3,`
`205`	`296`	`NCaseKind`
`206`	`297`	`} CaseKind;`
`207`	`298`
`@@ -232,14 +323,17 @@`
`232`	`323`	`dieifscalar @{$special{$code}{Lowercase} } !=$MAX_CASE_EXPANSION;`
`233`	`324`	`dieifscalar @{$special{$code}{Titlecase} } !=$MAX_CASE_EXPANSION;`
`234`	`325`	`dieifscalar @{$special{$code}{Uppercase} } !=$MAX_CASE_EXPANSION;`
	`326`	`+dieifscalar @{$special{$code}{Foldcase} } !=$MAX_CASE_EXPANSION;`
`235`	`327`	`my$lower =join",",`
`236`	`328`	`(map {sprintf"0x%06x",$_ } @{$special{$code}{Lowercase} });`
`237`	`329`	`my$title =join",",`
`238`	`330`	`(map {sprintf"0x%06x",$_ } @{$special{$code}{Titlecase} });`
`239`	`331`	`my$upper =join",",`
`240`	`332`	`(map {sprintf"0x%06x",$_ } @{$special{$code}{Uppercase} });`
	`333`	`+my$fold =join",",`
	`334`	`+ (map {sprintf"0x%06x",$_ } @{$special{$code}{Foldcase} });`
`241`	`335`	`printf$OT"\t{0x%06x,%s,",$code,$special{$code}{Conditions};`
`242`		`-printf$OT"{{%s}, {%s}, {%s}}},\n",$lower,$title,$upper;`
	`336`	`+printf$OT"{{%s}, {%s}, {%s}, {%s}}},\n",$lower,$title,$upper,$fold;`
`243`	`337`	`}`
`244`	`338`
`245`	`339`	`print$OT"\t{0, 0, {{0, 0, 0}, {0, 0, 0}, {0, 0, 0}}}\n";`
`@@ -260,11 +354,13 @@`
`260`	`354`	`my$lc = ($simple{$code}{Simple_Lowercase} \|\|$code);`
`261`	`355`	`my$tc = ($simple{$code}{Simple_Titlecase} \|\|$code);`
`262`	`356`	`my$uc = ($simple{$code}{Simple_Uppercase} \|\|$code);`
	`357`	`+my$fc = ($simple{$code}{Simple_Foldcase} \|\|$code);`
	`358`	`+`
`263`	`359`	`die"unexpected special case for code$code"`
`264`	`360`	`ifdefined$special{$code};`
`265`	`361`	`printf$OT`
`266`		`-"\t{0x%06x, {[CaseLower] = 0x%06x,[CaseTitle] = 0x%06x,[CaseUpper] = 0x%06x}, NULL},\n",`
`267`		`-$code,$lc,$tc,$uc;`
	`362`	`+"\t{0x%06x, {[CaseLower] = 0x%06x,[CaseTitle] = 0x%06x,[CaseUpper] = 0x%06x,[CaseFold] = 0x%06x}, NULL},\n",`
	`363`	`+$code,$lc,$tc,$uc,$fc;`
`268`	`364`	`}`
`269`	`365`	`printf$OT"\n";`
`270`	`366`
`@@ -280,8 +376,8 @@`
`280`	`376`	`$special_case =sprintf"&special_case[%d]",$special{$code}{Index};`
`281`	`377`	`}`
`282`	`378`	`printf$OT`
`283`		`-"\t{0x%06x, {[CaseLower] = 0x%06x,[CaseTitle] = 0x%06x,[CaseUpper] = 0x%06x},%s},\n",`
	`379`	`+"\t{0x%06x, {[CaseLower] = 0x%06x,[CaseTitle] = 0x%06x,[CaseUpper] = 0x%06x,[CaseFold] = 0x%06x},%s},\n",`
`284`	`380`	`$code,$map->{Simple_Lowercase},$map->{Simple_Titlecase},`
`285`		`-$map->{Simple_Uppercase},$special_case;`
	`381`	`+$map->{Simple_Uppercase},$map->{Simple_Foldcase},$special_case;`
`286`	`382`	`}`
`287`	`383`	`print$OT"};\n";`

`‎src/common/unicode/meson.build`

Lines changed: 2 additions & 2 deletions

Original file line number	Diff line number	Diff line change
`@@ -11,7 +11,7 @@ endif`
`11`	`11`
`12`	`12`	`# These files are part of the Unicode Character Database. Download them on`
`13`	`13`	`# demand.`
`14`		`-foreachf: ['CompositionExclusions.txt','DerivedCoreProperties.txt','DerivedNormalizationProps.txt','EastAsianWidth.txt','NormalizationTest.txt','PropList.txt','SpecialCasing.txt','UnicodeData.txt']`
	`14`	`+foreachf: ['CompositionExclusions.txt','CaseFolding.txt','DerivedCoreProperties.txt','DerivedNormalizationProps.txt','EastAsianWidth.txt','NormalizationTest.txt','PropList.txt','SpecialCasing.txt','UnicodeData.txt']`
`15`	`15`	`url= unicode_baseurl.format(UNICODE_VERSION, f)`
`16`	`16`	`target=custom_target(f,`
`17`	`17`	`output: f,`
`@@ -26,7 +26,7 @@ update_unicode_targets = []`
`26`	`26`
`27`	`27`	`update_unicode_targets+= \`
`28`	`28`	`custom_target('unicode_case_table.h',`
`29`		`-input: [unicode_data['SpecialCasing.txt'], unicode_data['UnicodeData.txt']],`
	`29`	`+input: [unicode_data['CaseFolding.txt'], unicode_data['SpecialCasing.txt'], unicode_data['UnicodeData.txt']],`
`30`	`30`	`output: ['unicode_case_table.h'],`
`31`	`31`	`command: [`
`32`	`32`	`perl,files('generate-unicode_case_table.pl'),`

`‎src/common/unicode_case.c`

Lines changed: 32 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -51,6 +51,14 @@ unicode_uppercase_simple(pg_wchar code)`
`51`	`51`	`returnmap ?map->simplemap[CaseUpper] :code;`
`52`	`52`	`}`
`53`	`53`
	`54`	`+pg_wchar`
	`55`	`+unicode_casefold_simple(pg_wcharcode)`
	`56`	`+{`
	`57`	`+constpg_case_map*map=find_case_map(code);`
	`58`	`+`
	`59`	`+returnmap ?map->simplemap[CaseFold] :code;`
	`60`	`+}`
	`61`	`+`
`54`	`62`	`/*`
`55`	`63`	`* unicode_strlower()`
`56`	`64`	`*`
`@@ -142,6 +150,30 @@ unicode_strupper(char dst, size_t dstsize, const char src, ssize_t srclen,`
`142`	`150`	`NULL);`
`143`	`151`	`}`
`144`	`152`
	`153`	`+/*`
	`154`	`+ * unicode_strfold()`
	`155`	`+ *`
	`156`	`+ * Case fold src, and return the result length (not including terminating`
	`157`	`+ * NUL).`
	`158`	`+ *`
	`159`	`+ * String src must be encoded in UTF-8. If srclen < 0, src must be`
	`160`	`+ * NUL-terminated.`
	`161`	`+ *`
	`162`	`+ * Result string is stored in dst, truncating if larger than dstsize. If`
	`163`	`+ * dstsize is greater than the result length, dst will be NUL-terminated;`
	`164`	`+ * otherwise not.`
	`165`	`+ *`
	`166`	`+ * If dstsize is zero, dst may be NULL. This is useful for calculating the`
	`167`	`+ * required buffer size before allocating.`
	`168`	`+ */`
	`169`	`+size_t`
	`170`	`+unicode_strfold(chardst,size_tdstsize,constcharsrc,ssize_tsrclen,`
	`171`	`+boolfull)`
	`172`	`+{`
	`173`	`+returnconvert_case(dst,dstsize,src,srclen,CaseFold,full,NULL,`
	`174`	`+NULL);`
	`175`	`+}`
	`176`	`+`
`145`	`177`	`/*`
`146`	`178`	`* Implement Unicode Default Case Conversion algorithm.`
`147`	`179`	`*`

`‎src/include/common/unicode_case.h`

Lines changed: 3 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -21,12 +21,15 @@ typedef size_t (WordBoundaryNext) (void wbstate);`
`21`	`21`	`pg_wcharunicode_lowercase_simple(pg_wcharcode);`
`22`	`22`	`pg_wcharunicode_titlecase_simple(pg_wcharcode);`
`23`	`23`	`pg_wcharunicode_uppercase_simple(pg_wcharcode);`
	`24`	`+pg_wcharunicode_casefold_simple(pg_wcharcode);`
`24`	`25`	`size_tunicode_strlower(chardst,size_tdstsize,constcharsrc,`
`25`	`26`	`ssize_tsrclen,boolfull);`
`26`	`27`	`size_tunicode_strtitle(chardst,size_tdstsize,constcharsrc,`
`27`	`28`	`ssize_tsrclen,boolfull,`
`28`	`29`	`WordBoundaryNextwbnext,void*wbstate);`
`29`	`30`	`size_tunicode_strupper(chardst,size_tdstsize,constcharsrc,`
`30`	`31`	`ssize_tsrclen,boolfull);`
	`32`	`+size_tunicode_strfold(chardst,size_tdstsize,constcharsrc,`
	`33`	`+ssize_tsrclen,boolfull);`
`31`	`34`
`32`	`35`	`#endif/* UNICODE_CASE_H */`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit 4e7f62b

File tree

7 files changed

7 files changed

`‎src/common/unicode/Makefile`

`‎src/common/unicode/case_test.c`

`‎src/common/unicode/generate-unicode_case_table.pl`

`‎src/common/unicode/meson.build`

`‎src/common/unicode_case.c`

`‎src/include/common/unicode_case.h`

0 commit comments