From e9af22730e68908f46c9aee3b35e133d34191bef Mon Sep 17 00:00:00 2001 From: Ryo Nihei Date: Fri, 26 Nov 2021 00:01:16 +0900 Subject: Support Alphabetic property (Meet RL1.2 of UTS #18 partially) --- compiler/ucd_table.go.tmpl | 10 ++++++++++ 1 file changed, 10 insertions(+) (limited to 'compiler/ucd_table.go.tmpl') diff --git a/compiler/ucd_table.go.tmpl b/compiler/ucd_table.go.tmpl index ad336d9..8d6fbc8 100644 --- a/compiler/ucd_table.go.tmpl +++ b/compiler/ucd_table.go.tmpl @@ -26,6 +26,7 @@ var compositGeneralCategories = map[string][]string{ // https://www.unicode.org/Public/13.0.0/ucd/DerivedCoreProperties.txt var derivedCoreProperties = map[string][]string{ + "alpha": {`\p{Lowercase=yes}`, `\p{Uppercase=yes}`, `\p{Lt}`, `\p{Lm}`, `\p{Lo}`, `\p{Nl}`, `\p{Other_Alphabetic=yes}`}, "lower": {`\p{Ll}`, `\p{Other_Lowercase=yes}`}, "upper": {`\p{Lu}`, `\p{Other_Uppercase=yes}`}, } @@ -34,6 +35,10 @@ var derivedCoreProperties = map[string][]string{ var propertyNameAbbs = map[string]string{ "generalcategory": "gc", "gc": "gc", + "alphabetic": "alpha", + "alpha": "alpha", + "otheralphabetic": "oalpha", + "oalpha": "oalpha", "lowercase": "lower", "lower": "lower", "uppercase": "upper", @@ -72,6 +77,11 @@ var generalCategoryCodePoints = map[string][]*ucd.CodePointRange{ {{ range $prop },{{ end }} } +// https://www.unicode.org/Public/13.0.0/ucd/PropList.txt +var otherAlphabeticCodePoints = []*ucd.CodePointRange{ {{ range .PropList.OtherAlphabetic }} + &ucd.CodePointRange{From: rune({{ .From }}), To: rune({{ .To }})},{{ end }} +} + // https://www.unicode.org/Public/13.0.0/ucd/PropList.txt var otherLowercaseCodePoints = []*ucd.CodePointRange{ {{ range .PropList.OtherLowercase }} &ucd.CodePointRange{From: rune({{ .From }}), To: rune({{ .To }})},{{ end }} -- cgit v1.2.3