aboutsummaryrefslogtreecommitdiff
path: root/spec
diff options
context:
space:
mode:
authorRyo Nihei <nihei.dev@gmail.com>2021-09-18 17:07:09 +0900
committerRyo Nihei <nihei.dev@gmail.com>2021-09-18 17:07:09 +0900
commitfe865a812401c2c612f2cd17cedd4728dc4798f7 (patch)
tree007dbc653364809e2273ba95aef0f1bea2006127 /spec
parentUpdate CHANGELOG (diff)
downloadtre-fe865a812401c2c612f2cd17cedd4728dc4798f7.tar.gz
tre-fe865a812401c2c612f2cd17cedd4728dc4798f7.tar.xz
Generate constant values representing mode IDs, mode names, kind IDs, and kind names
Diffstat (limited to 'spec')
-rw-r--r--spec/spec.go154
-rw-r--r--spec/spec_test.go211
2 files changed, 350 insertions, 15 deletions
diff --git a/spec/spec.go b/spec/spec.go
index 9ac5f4b..62acfc4 100644
--- a/spec/spec.go
+++ b/spec/spec.go
@@ -3,6 +3,7 @@ package spec
import (
"fmt"
"regexp"
+ "sort"
"strconv"
"strings"
)
@@ -42,19 +43,13 @@ func (k LexKindName) String() string {
}
func (k LexKindName) validate() error {
- if k == "" {
- return fmt.Errorf("kind doesn't allow to be the empty string")
- }
- if !lexKindNameRE.Match([]byte(k)) {
- return fmt.Errorf("kind must be %v", lexKindNamePattern)
+ err := validateIdentifier(k.String())
+ if err != nil {
+ return fmt.Errorf("invalid kind name: %v", err)
}
return nil
}
-const lexKindNamePattern = "[A-Za-z_][0-9A-Za-z_]*"
-
-var lexKindNameRE = regexp.MustCompile(lexKindNamePattern)
-
// LexPattern represents a pattern of a lexeme.
// The pattern is written in regular expression.
type LexPattern string
@@ -99,19 +94,38 @@ func (m LexModeName) String() string {
}
func (m LexModeName) validate() error {
- if m.isNil() || !lexModeNameRE.Match([]byte(m)) {
- return fmt.Errorf("mode must be %v", lexModeNamePattern)
+ err := validateIdentifier(m.String())
+ if err != nil {
+ return fmt.Errorf("invalid mode name: %v", err)
}
return nil
}
-func (m LexModeName) isNil() bool {
- return m == LexModeNameNil
// idPattern is the regular expression every identifier must match in full:
// an ASCII letter first, then any number of groups made of an optional single
// underscore followed by one or more ASCII letters or digits. Consequently an
// identifier can neither start with a digit or an underscore, end with an
// underscore, nor contain consecutive underscores.
const idPattern = `^[A-Za-z](_?[0-9A-Za-z]+)*$`

// idRE is idPattern compiled once at package initialization.
var idRE = regexp.MustCompile(idPattern)

// validateIdentifier reports whether id is a valid identifier.
// It returns nil for a valid identifier, a dedicated error for the empty
// string, and an error quoting idPattern for any other mismatch.
func validateIdentifier(id string) error {
	switch {
	case id == "":
		// Checked separately so that the empty string gets its own message.
		return fmt.Errorf("identifier doesn't allow to be the empty string")
	case !idRE.MatchString(id):
		return fmt.Errorf("identifier must be %v", idPattern)
	default:
		return nil
	}
}
-const lexModeNamePattern = "[A-Za-z_][0-9A-Za-z_]*"
// SnakeCaseToUpperCamelCase converts a snake_case string to UpperCamelCase.
//
// The input is split on underscores, the first character of every non-empty
// element is upper-cased, and the elements are concatenated. Characters after
// the first one are left untouched, so "fooBar" becomes "FooBar" and "FOO_BAR"
// becomes "FOOBAR". Empty elements are dropped, which means leading, trailing,
// and repeated underscores simply disappear from the result.
func SnakeCaseToUpperCamelCase(snake string) string {
	elems := strings.Split(snake, "_")
	for i, e := range elems {
		if e == "" {
			continue
		}

		// Find where the first character ends. Ranging over a string yields
		// the byte offset of each character, so the second offset is the
		// width of the first one. Upper-casing only the first byte would
		// corrupt a multi-byte UTF-8 character.
		end := len(e)
		for pos := range e {
			if pos > 0 {
				end = pos
				break
			}
		}
		elems[i] = strings.ToUpper(e[:end]) + e[end:]
	}

	return strings.Join(elems, "")
}
type LexEntry struct {
Kind LexKindName `json:"kind"`
@@ -185,9 +199,119 @@ func (s *LexSpec) Validate() error {
}
}
}
+ {
+ kinds := []string{}
+ modes := []string{
+ LexModeNameDefault.String(), // This is a predefined mode.
+ }
+ for _, e := range s.Entries {
+ if e.Fragment {
+ continue
+ }
+
+ kinds = append(kinds, e.Kind.String())
+
+ for _, m := range e.Modes {
+ modes = append(modes, m.String())
+ }
+ }
+
+ kindErrs := findSpellingInconsistenciesErrors(kinds, nil)
+ modeErrs := findSpellingInconsistenciesErrors(modes, func(ids []string) error {
+ if SnakeCaseToUpperCamelCase(ids[0]) == SnakeCaseToUpperCamelCase(LexModeNameDefault.String()) {
+ var b strings.Builder
+ fmt.Fprintf(&b, "%+v", ids[0])
+ for _, id := range ids[1:] {
+ fmt.Fprintf(&b, ", %+v", id)
+ }
+ return fmt.Errorf("these identifiers are treated as the same. please use the same spelling as predefined '%v': %v", LexModeNameDefault, b.String())
+ }
+ return nil
+ })
+ errs := append(kindErrs, modeErrs...)
+ if len(errs) > 0 {
+ var b strings.Builder
+ fmt.Fprintf(&b, "%v", errs[0])
+ for _, err := range errs[1:] {
+ fmt.Fprintf(&b, "\n%v", err)
+ }
+ return fmt.Errorf(b.String())
+ }
+ }
+
return nil
}
+func findSpellingInconsistenciesErrors(ids []string, hook func(ids []string) error) []error {
+ duplicated := FindSpellingInconsistencies(ids)
+ if len(duplicated) == 0 {
+ return nil
+ }
+
+ var errs []error
+ for _, dup := range duplicated {
+ err := hook(dup)
+ if err != nil {
+ errs = append(errs, err)
+ continue
+ }
+
+ var b strings.Builder
+ fmt.Fprintf(&b, "%+v", dup[0])
+ for _, id := range dup[1:] {
+ fmt.Fprintf(&b, ", %+v", id)
+ }
+ err = fmt.Errorf("these identifiers are treated as the same. please use the same spelling: %v", b.String())
+ errs = append(errs, err)
+ }
+
+ return errs
+}
+
+// FindSpellingInconsistencies finds spelling inconsistencies in identifiers. The identifiers are considered to be the same
+// if they are spelled the same when expressed in UpperCamelCase. For example, `left_paren` and `LeftParen` are spelled the same
+// in UpperCamelCase. Thus they are considere to be spelling inconsistency.
+func FindSpellingInconsistencies(ids []string) [][]string {
+ m := map[string][]string{}
+ for _, id := range removeDuplicates(ids) {
+ c := SnakeCaseToUpperCamelCase(id)
+ m[c] = append(m[c], id)
+ }
+
+ var duplicated [][]string
+ for _, camels := range m {
+ if len(camels) == 1 {
+ continue
+ }
+ duplicated = append(duplicated, camels)
+ }
+
+ for _, dup := range duplicated {
+ sort.Slice(dup, func(i, j int) bool {
+ return dup[i] < dup[j]
+ })
+ }
+ sort.Slice(duplicated, func(i, j int) bool {
+ return duplicated[i][0] < duplicated[j][0]
+ })
+
+ return duplicated
+}
+
// removeDuplicates returns the distinct strings of s in the order of their
// first occurrence. The input slice is not modified. It returns nil when s is
// empty.
func removeDuplicates(s []string) []string {
	if len(s) == 0 {
		return nil
	}

	seen := make(map[string]struct{}, len(s))
	unique := make([]string, 0, len(s))
	for _, v := range s {
		if _, ok := seen[v]; ok {
			continue
		}
		seen[v] = struct{}{}
		// Appending while scanning keeps the result deterministic instead
		// of depending on map iteration order.
		unique = append(unique, v)
	}

	return unique
}
+
// StateID represents an ID of a state of a transition table.
// Its underlying type is int.
type StateID int
diff --git a/spec/spec_test.go b/spec/spec_test.go
new file mode 100644
index 0000000..54d7b7d
--- /dev/null
+++ b/spec/spec_test.go
@@ -0,0 +1,211 @@
+package spec
+
+import (
+ "fmt"
+ "testing"
+)
+
// idTests is the identifier table shared by the identifier, kind name, and
// mode name validation tests. Entries with invalid set to true must be
// rejected; all others must be accepted.
var idTests = []struct {
	id      string
	invalid bool
}{
	// Well-formed identifiers.
	{id: "foo"},
	{id: "foo2"},
	{id: "foo_bar_baz"},
	{id: "f_o_o"},

	// Malformed identifiers: leading digit, leading or trailing underscore,
	// and consecutive underscores.
	{id: "2foo", invalid: true},
	{id: "_foo", invalid: true},
	{id: "foo_", invalid: true},
	{id: "foo__bar", invalid: true},
}
+
+func TestValidateIdentifier(t *testing.T) {
+ for _, tt := range idTests {
+ t.Run(tt.id, func(t *testing.T) {
+ err := validateIdentifier(tt.id)
+ if tt.invalid {
+ if err == nil {
+ t.Errorf("expected error didn't occur")
+ }
+ } else {
+ if err != nil {
+ t.Errorf("unexpected error occurred: %v", err)
+ }
+ }
+ })
+ }
+}
+
+func TestLexKindName_validate(t *testing.T) {
+ for _, tt := range idTests {
+ t.Run(tt.id, func(t *testing.T) {
+ err := LexKindName(tt.id).validate()
+ if tt.invalid {
+ if err == nil {
+ t.Errorf("expected error didn't occur")
+ }
+ } else {
+ if err != nil {
+ t.Errorf("unexpected error occurred: %v", err)
+ }
+ }
+ })
+ }
+}
+
+func TestLexModeName_validate(t *testing.T) {
+ for _, tt := range idTests {
+ t.Run(tt.id, func(t *testing.T) {
+ err := LexModeName(tt.id).validate()
+ if tt.invalid {
+ if err == nil {
+ t.Errorf("expected error didn't occur")
+ }
+ } else {
+ if err != nil {
+ t.Errorf("unexpected error occurred: %v", err)
+ }
+ }
+ })
+ }
+}
+
+func TestSnakeCaseToUpperCamelCase(t *testing.T) {
+ tests := []struct {
+ snake string
+ camel string
+ }{
+ {
+ snake: "foo",
+ camel: "Foo",
+ },
+ {
+ snake: "foo_bar",
+ camel: "FooBar",
+ },
+ {
+ snake: "foo_bar_baz",
+ camel: "FooBarBaz",
+ },
+ {
+ snake: "Foo",
+ camel: "Foo",
+ },
+ {
+ snake: "fooBar",
+ camel: "FooBar",
+ },
+ {
+ snake: "FOO",
+ camel: "FOO",
+ },
+ {
+ snake: "FOO_BAR",
+ camel: "FOOBAR",
+ },
+ {
+ snake: "_foo_bar_",
+ camel: "FooBar",
+ },
+ {
+ snake: "___foo___bar___",
+ camel: "FooBar",
+ },
+ }
+ for _, tt := range tests {
+ c := SnakeCaseToUpperCamelCase(tt.snake)
+ if c != tt.camel {
+ t.Errorf("unexpected string; want: %v, got: %v", tt.camel, c)
+ }
+ }
+}
+
+func TestFindSpellingInconsistencies(t *testing.T) {
+ tests := []struct {
+ ids []string
+ duplicated [][]string
+ }{
+ {
+ ids: []string{"foo", "foo"},
+ duplicated: nil,
+ },
+ {
+ ids: []string{"foo", "Foo"},
+ duplicated: [][]string{{"Foo", "foo"}},
+ },
+ {
+ ids: []string{"foo", "foo", "Foo"},
+ duplicated: [][]string{{"Foo", "foo"}},
+ },
+ {
+ ids: []string{"foo_bar_baz", "FooBarBaz"},
+ duplicated: [][]string{{"FooBarBaz", "foo_bar_baz"}},
+ },
+ {
+ ids: []string{"foo", "Foo", "bar", "Bar"},
+ duplicated: [][]string{{"Bar", "bar"}, {"Foo", "foo"}},
+ },
+ {
+ ids: []string{"foo", "Foo", "bar", "Bar", "baz", "bra"},
+ duplicated: [][]string{{"Bar", "bar"}, {"Foo", "foo"}},
+ },
+ }
+ for i, tt := range tests {
+ t.Run(fmt.Sprintf("#%v", i), func(t *testing.T) {
+ duplicated := FindSpellingInconsistencies(tt.ids)
+ if len(duplicated) != len(tt.duplicated) {
+ t.Fatalf("unexpected IDs; want: %#v, got: %#v", tt.duplicated, duplicated)
+ }
+ for i, dupIDs := range duplicated {
+ if len(dupIDs) != len(tt.duplicated[i]) {
+ t.Fatalf("unexpected IDs; want: %#v, got: %#v", tt.duplicated[i], dupIDs)
+ }
+ for j, id := range dupIDs {
+ if id != tt.duplicated[i][j] {
+ t.Fatalf("unexpected IDs; want: %#v, got: %#v", tt.duplicated[i], dupIDs)
+ }
+ }
+ }
+ })
+ }
+}
+
+func TestLexSpec_Validate(t *testing.T) {
+ // We expect that the spelling inconsistency error will occur.
+ spec := &LexSpec{
+ Entries: []*LexEntry{
+ {
+ Modes: []LexModeName{
+ // 'Default' is the spelling inconsistency because 'default' is predefined.
+ "Default",
+ },
+ Kind: "foo",
+ Pattern: "foo",
+ },
+ },
+ }
+ err := spec.Validate()
+ if err == nil {
+ t.Fatalf("expected error didn't occur")
+ }
+}