| // Copyright 2013 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| package language |
| |
| import ( |
| "reflect" |
| "testing" |
| ) |
| |
| func TestTagSize(t *testing.T) { |
| id := Tag{} |
| typ := reflect.TypeOf(id) |
| if typ.Size() > 24 { |
| t.Errorf("size of Tag was %d; want 24", typ.Size()) |
| } |
| } |
| |
| func TestIsRoot(t *testing.T) { |
| loc := Tag{} |
| if !loc.IsRoot() { |
| t.Errorf("unspecified should be root.") |
| } |
| for i, tt := range parseTests() { |
| loc, _ := Parse(tt.in) |
| undef := tt.lang == "und" && tt.script == "" && tt.region == "" && tt.ext == "" |
| if loc.IsRoot() != undef { |
| t.Errorf("%d: was %v; want %v", i, loc.IsRoot(), undef) |
| } |
| } |
| } |
| |
| func TestEquality(t *testing.T) { |
| for i, tt := range parseTests() { |
| s := tt.in |
| tag := Make(s) |
| t1 := Make(tag.String()) |
| if tag != t1 { |
| t.Errorf("%d:%s: equality test 1 failed\n got: %#v\nwant: %#v)", i, s, t1, tag) |
| } |
| t2, _ := Compose(tag) |
| if tag != t2 { |
| t.Errorf("%d:%s: equality test 2 failed\n got: %#v\nwant: %#v", i, s, t2, tag) |
| } |
| } |
| } |
| |
| func TestString(t *testing.T) { |
| tests := []string{ |
| "no-u-rg-dkzzzz", |
| } |
| for i, s := range tests { |
| tag := Make(s) |
| if tag.String() != s { |
| t.Errorf("%d:%s: got %s: want %s (%#v)", i, s, tag.String(), s, tag) |
| } |
| } |
| } |
| |
| func TestMarshal(t *testing.T) { |
| testCases := []string{ |
| // TODO: these values will change with each CLDR update. This issue |
| // will be solved if we decide to fix the indexes. |
| "und", |
| "ca-ES-valencia", |
| "ca-ES-valencia-u-va-posix", |
| "ca-ES-valencia-u-co-phonebk", |
| "ca-ES-valencia-u-co-phonebk-va-posix", |
| "x-klingon", |
| "en-US", |
| "en-US-u-va-posix", |
| "en", |
| "en-u-co-phonebk", |
| "en-001", |
| "sh", |
| |
| "en-GB-u-rg-uszzzz", |
| "en-GB-u-rg-uszzzz-va-posix", |
| "en-GB-u-co-phonebk-rg-uszzzz", |
| // Invalid tags should also roundtrip. |
| "en-GB-u-co-phonebk-rg-uszz", |
| } |
| for _, tc := range testCases { |
| var tag Tag |
| err := tag.UnmarshalText([]byte(tc)) |
| if err != nil { |
| t.Errorf("UnmarshalText(%q): unexpected error: %v", tc, err) |
| } |
| b, err := tag.MarshalText() |
| if err != nil { |
| t.Errorf("MarshalText(%q): unexpected error: %v", tc, err) |
| } |
| if got := string(b); got != tc { |
| t.Errorf("%s: got %q; want %q", tc, got, tc) |
| } |
| } |
| } |
| |
| func TestBase(t *testing.T) { |
| tests := []struct { |
| loc, lang string |
| conf Confidence |
| }{ |
| {"und", "en", Low}, |
| {"x-abc", "und", No}, |
| {"en", "en", Exact}, |
| {"und-Cyrl", "ru", High}, |
| // If a region is not included, the official language should be English. |
| {"und-US", "en", High}, |
| // TODO: not-explicitly listed scripts should probably be und, No |
| // Modify addTags to return info on how the match was derived. |
| // {"und-Aghb", "und", No}, |
| } |
| for i, tt := range tests { |
| loc, _ := Parse(tt.loc) |
| lang, conf := loc.Base() |
| if lang.String() != tt.lang { |
| t.Errorf("%d: language was %s; want %s", i, lang, tt.lang) |
| } |
| if conf != tt.conf { |
| t.Errorf("%d: confidence was %d; want %d", i, conf, tt.conf) |
| } |
| } |
| } |
| |
| func TestParseBase(t *testing.T) { |
| tests := []struct { |
| in string |
| out string |
| ok bool |
| }{ |
| {"en", "en", true}, |
| {"EN", "en", true}, |
| {"nld", "nl", true}, |
| {"dut", "dut", true}, // bibliographic |
| {"aaj", "und", false}, // unknown |
| {"qaa", "qaa", true}, |
| {"a", "und", false}, |
| {"", "und", false}, |
| {"aaaa", "und", false}, |
| } |
| for i, tt := range tests { |
| x, err := ParseBase(tt.in) |
| if x.String() != tt.out || err == nil != tt.ok { |
| t.Errorf("%d:%s: was %s, %v; want %s, %v", i, tt.in, x, err == nil, tt.out, tt.ok) |
| } |
| if y, _, _ := Raw.Make(tt.out).Raw(); x != y { |
| t.Errorf("%d:%s: tag was %s; want %s", i, tt.in, x, y) |
| } |
| } |
| } |
| |
| func TestScript(t *testing.T) { |
| tests := []struct { |
| loc, scr string |
| conf Confidence |
| }{ |
| {"und", "Latn", Low}, |
| {"en-Latn", "Latn", Exact}, |
| {"en", "Latn", High}, |
| {"sr", "Cyrl", Low}, |
| {"kk", "Cyrl", High}, |
| {"kk-CN", "Arab", Low}, |
| {"cmn", "Hans", Low}, |
| {"ru", "Cyrl", High}, |
| {"ru-RU", "Cyrl", High}, |
| {"yue", "Hant", Low}, |
| {"x-abc", "Zzzz", Low}, |
| {"und-zyyy", "Zyyy", Exact}, |
| } |
| for i, tt := range tests { |
| loc, _ := Parse(tt.loc) |
| sc, conf := loc.Script() |
| if sc.String() != tt.scr { |
| t.Errorf("%d:%s: script was %s; want %s", i, tt.loc, sc, tt.scr) |
| } |
| if conf != tt.conf { |
| t.Errorf("%d:%s: confidence was %d; want %d", i, tt.loc, conf, tt.conf) |
| } |
| } |
| } |
| |
| func TestParseScript(t *testing.T) { |
| tests := []struct { |
| in string |
| out string |
| ok bool |
| }{ |
| {"Latn", "Latn", true}, |
| {"zzzz", "Zzzz", true}, |
| {"zyyy", "Zyyy", true}, |
| {"Latm", "Zzzz", false}, |
| {"Zzz", "Zzzz", false}, |
| {"", "Zzzz", false}, |
| {"Zzzxx", "Zzzz", false}, |
| } |
| for i, tt := range tests { |
| x, err := ParseScript(tt.in) |
| if x.String() != tt.out || err == nil != tt.ok { |
| t.Errorf("%d:%s: was %s, %v; want %s, %v", i, tt.in, x, err == nil, tt.out, tt.ok) |
| } |
| if err == nil { |
| if _, y, _ := Raw.Make("und-" + tt.out).Raw(); x != y { |
| t.Errorf("%d:%s: tag was %s; want %s", i, tt.in, x, y) |
| } |
| } |
| } |
| } |
| |
| func TestRegion(t *testing.T) { |
| tests := []struct { |
| loc, reg string |
| conf Confidence |
| }{ |
| {"und", "US", Low}, |
| {"en", "US", Low}, |
| {"zh-Hant", "TW", Low}, |
| {"en-US", "US", Exact}, |
| {"cmn", "CN", Low}, |
| {"ru", "RU", Low}, |
| {"yue", "HK", Low}, |
| {"x-abc", "ZZ", Low}, |
| } |
| for i, tt := range tests { |
| loc, _ := Raw.Parse(tt.loc) |
| reg, conf := loc.Region() |
| if reg.String() != tt.reg { |
| t.Errorf("%d:%s: region was %s; want %s", i, tt.loc, reg, tt.reg) |
| } |
| if conf != tt.conf { |
| t.Errorf("%d:%s: confidence was %d; want %d", i, tt.loc, conf, tt.conf) |
| } |
| } |
| } |
| |
| func TestEncodeM49(t *testing.T) { |
| tests := []struct { |
| m49 int |
| code string |
| ok bool |
| }{ |
| {1, "001", true}, |
| {840, "US", true}, |
| {899, "ZZ", false}, |
| } |
| for i, tt := range tests { |
| if r, err := EncodeM49(tt.m49); r.String() != tt.code || err == nil != tt.ok { |
| t.Errorf("%d:%d: was %s, %v; want %s, %v", i, tt.m49, r, err == nil, tt.code, tt.ok) |
| } |
| } |
| for i := 1; i <= 1000; i++ { |
| if r, err := EncodeM49(i); err == nil && r.M49() == 0 { |
| t.Errorf("%d has no error, but maps to undefined region", i) |
| } |
| } |
| } |
| |
| func TestParseRegion(t *testing.T) { |
| tests := []struct { |
| in string |
| out string |
| ok bool |
| }{ |
| {"001", "001", true}, |
| {"840", "US", true}, |
| {"899", "ZZ", false}, |
| {"USA", "US", true}, |
| {"US", "US", true}, |
| {"BC", "ZZ", false}, |
| {"C", "ZZ", false}, |
| {"CCCC", "ZZ", false}, |
| {"01", "ZZ", false}, |
| } |
| for i, tt := range tests { |
| r, err := ParseRegion(tt.in) |
| if r.String() != tt.out || err == nil != tt.ok { |
| t.Errorf("%d:%s: was %s, %v; want %s, %v", i, tt.in, r, err == nil, tt.out, tt.ok) |
| } |
| if err == nil { |
| if _, _, y := Raw.Make("und-" + tt.out).Raw(); r != y { |
| t.Errorf("%d:%s: tag was %s; want %s", i, tt.in, r, y) |
| } |
| } |
| } |
| } |
| |
| func TestIsCountry(t *testing.T) { |
| tests := []struct { |
| reg string |
| country bool |
| }{ |
| {"US", true}, |
| {"001", false}, |
| {"958", false}, |
| {"419", false}, |
| {"203", true}, |
| {"020", true}, |
| {"900", false}, |
| {"999", false}, |
| {"QO", false}, |
| {"EU", false}, |
| {"AA", false}, |
| {"XK", true}, |
| } |
| for i, tt := range tests { |
| r, _ := ParseRegion(tt.reg) |
| if r.IsCountry() != tt.country { |
| t.Errorf("%d: IsCountry(%s) was %v; want %v", i, tt.reg, r.IsCountry(), tt.country) |
| } |
| } |
| } |
| |
| func TestIsGroup(t *testing.T) { |
| tests := []struct { |
| reg string |
| group bool |
| }{ |
| {"US", false}, |
| {"001", true}, |
| {"958", false}, |
| {"419", true}, |
| {"203", false}, |
| {"020", false}, |
| {"900", false}, |
| {"999", false}, |
| {"QO", true}, |
| {"EU", true}, |
| {"AA", false}, |
| {"XK", false}, |
| } |
| for i, tt := range tests { |
| r, _ := ParseRegion(tt.reg) |
| if r.IsGroup() != tt.group { |
| t.Errorf("%d: IsGroup(%s) was %v; want %v", i, tt.reg, r.IsGroup(), tt.group) |
| } |
| } |
| } |
| |
| func TestContains(t *testing.T) { |
| tests := []struct { |
| enclosing, contained string |
| contains bool |
| }{ |
| // A region contains itself. |
| {"US", "US", true}, |
| {"001", "001", true}, |
| |
| // Direct containment. |
| {"001", "002", true}, |
| {"039", "XK", true}, |
| {"150", "XK", true}, |
| {"EU", "AT", true}, |
| {"QO", "AQ", true}, |
| |
| // Indirect containemnt. |
| {"001", "US", true}, |
| {"001", "419", true}, |
| {"001", "013", true}, |
| |
| // No containment. |
| {"US", "001", false}, |
| {"155", "EU", false}, |
| } |
| for i, tt := range tests { |
| r := MustParseRegion(tt.enclosing) |
| con := MustParseRegion(tt.contained) |
| if got := r.Contains(con); got != tt.contains { |
| t.Errorf("%d: %s.Contains(%s) was %v; want %v", i, tt.enclosing, tt.contained, got, tt.contains) |
| } |
| } |
| } |
| |
| func TestRegionCanonicalize(t *testing.T) { |
| for i, tt := range []struct{ in, out string }{ |
| {"UK", "GB"}, |
| {"TP", "TL"}, |
| {"QU", "EU"}, |
| {"SU", "SU"}, |
| {"VD", "VN"}, |
| {"DD", "DE"}, |
| } { |
| r := MustParseRegion(tt.in) |
| want := MustParseRegion(tt.out) |
| if got := r.Canonicalize(); got != want { |
| t.Errorf("%d: got %v; want %v", i, got, want) |
| } |
| } |
| } |
| |
| func TestRegionTLD(t *testing.T) { |
| for _, tt := range []struct { |
| in, out string |
| ok bool |
| }{ |
| {"EH", "EH", true}, |
| {"FR", "FR", true}, |
| {"TL", "TL", true}, |
| |
| // In ccTLD before in ISO. |
| {"GG", "GG", true}, |
| |
| // Non-standard assignment of ccTLD to ISO code. |
| {"GB", "UK", true}, |
| |
| // Exceptionally reserved in ISO and valid ccTLD. |
| {"UK", "UK", true}, |
| {"AC", "AC", true}, |
| {"EU", "EU", true}, |
| {"SU", "SU", true}, |
| |
| // Exceptionally reserved in ISO and invalid ccTLD. |
| {"CP", "ZZ", false}, |
| {"DG", "ZZ", false}, |
| {"EA", "ZZ", false}, |
| {"FX", "ZZ", false}, |
| {"IC", "ZZ", false}, |
| {"TA", "ZZ", false}, |
| |
| // Transitionally reserved in ISO (e.g. deprecated) but valid ccTLD as |
| // it is still being phased out. |
| {"AN", "AN", true}, |
| {"TP", "TP", true}, |
| |
| // Transitionally reserved in ISO (e.g. deprecated) and invalid ccTLD. |
| // Defined in package language as it has a mapping in CLDR. |
| {"BU", "ZZ", false}, |
| {"CS", "ZZ", false}, |
| {"NT", "ZZ", false}, |
| {"YU", "ZZ", false}, |
| {"ZR", "ZZ", false}, |
| // Not defined in package: SF. |
| |
| // Indeterminately reserved in ISO. |
| // Defined in package language as it has a legacy mapping in CLDR. |
| {"DY", "ZZ", false}, |
| {"RH", "ZZ", false}, |
| {"VD", "ZZ", false}, |
| // Not defined in package: EW, FL, JA, LF, PI, RA, RB, RC, RI, RL, RM, |
| // RN, RP, WG, WL, WV, and YV. |
| |
| // Not assigned in ISO, but legacy definitions in CLDR. |
| {"DD", "ZZ", false}, |
| {"YD", "ZZ", false}, |
| |
| // Normal mappings but somewhat special status in ccTLD. |
| {"BL", "BL", true}, |
| {"MF", "MF", true}, |
| {"BV", "BV", true}, |
| {"SJ", "SJ", true}, |
| |
| // Have values when normalized, but not as is. |
| {"QU", "ZZ", false}, |
| |
| // ISO Private Use. |
| {"AA", "ZZ", false}, |
| {"QM", "ZZ", false}, |
| {"QO", "ZZ", false}, |
| {"XA", "ZZ", false}, |
| {"XK", "ZZ", false}, // Sometimes used for Kosovo, but invalid ccTLD. |
| } { |
| if tt.in == "" { |
| continue |
| } |
| |
| r := MustParseRegion(tt.in) |
| var want Region |
| if tt.out != "ZZ" { |
| want = MustParseRegion(tt.out) |
| } |
| tld, err := r.TLD() |
| if got := err == nil; got != tt.ok { |
| t.Errorf("error(%v): got %v; want %v", r, got, tt.ok) |
| } |
| if tld != want { |
| t.Errorf("TLD(%v): got %v; want %v", r, tld, want) |
| } |
| } |
| } |
| |
| func TestCanonicalize(t *testing.T) { |
| // TODO: do a full test using CLDR data in a separate regression test. |
| tests := []struct { |
| in, out string |
| option CanonType |
| }{ |
| {"en-Latn", "en", SuppressScript}, |
| {"sr-Cyrl", "sr-Cyrl", SuppressScript}, |
| {"sh", "sr-Latn", Legacy}, |
| {"sh-HR", "sr-Latn-HR", Legacy}, |
| {"sh-Cyrl-HR", "sr-Cyrl-HR", Legacy}, |
| {"tl", "fil", Legacy}, |
| {"no", "no", Legacy}, |
| {"no", "nb", Legacy | CLDR}, |
| {"cmn", "cmn", Legacy}, |
| {"cmn", "zh", Macro}, |
| {"cmn-u-co-stroke", "zh-u-co-stroke", Macro}, |
| {"yue", "yue", Macro}, |
| {"nb", "no", Macro}, |
| {"nb", "nb", Macro | CLDR}, |
| {"no", "no", Macro}, |
| {"no", "no", Macro | CLDR}, |
| {"iw", "he", DeprecatedBase}, |
| {"iw", "he", Deprecated | CLDR}, |
| {"mo", "ro-MD", Deprecated}, // Adopted by CLDR as of version 25. |
| {"alb", "sq", Legacy}, // bibliographic |
| {"dut", "nl", Legacy}, // bibliographic |
| // As of CLDR 25, mo is no longer considered a legacy mapping. |
| {"mo", "mo", Legacy | CLDR}, |
| {"und-AN", "und-AN", Deprecated}, |
| {"und-YD", "und-YE", DeprecatedRegion}, |
| {"und-YD", "und-YD", DeprecatedBase}, |
| {"und-Qaai", "und-Zinh", DeprecatedScript}, |
| {"und-Qaai", "und-Qaai", DeprecatedBase}, |
| {"drh", "mn", All}, // drh -> khk -> mn |
| |
| {"en-GB-u-rg-uszzzz", "en-GB-u-rg-uszzzz", Raw}, |
| {"en-GB-u-rg-USZZZZ", "en-GB-u-rg-uszzzz", Raw}, |
| // TODO: use different exact values for language and regional tag? |
| {"en-GB-u-rg-uszzzz-va-posix", "en-GB-u-rg-uszzzz-va-posix", Raw}, |
| {"en-GB-u-rg-uszzzz-co-phonebk", "en-GB-u-co-phonebk-rg-uszzzz", Raw}, |
| // Invalid region specifications are left as is. |
| {"en-GB-u-rg-usz", "en-GB-u-rg-usz", Raw}, |
| {"en-GB-u-rg-usz-va-posix", "en-GB-u-rg-usz-va-posix", Raw}, |
| {"en-GB-u-rg-usz-co-phonebk", "en-GB-u-co-phonebk-rg-usz", Raw}, |
| |
| // CVE-2020-28851 |
| // invalid key-value pair of -u- extension. |
| {"ES-u-000-00", "es-u-000-00", Raw}, |
| {"ES-u-000-00-v-00", "es-u-000-00-v-00", Raw}, |
| // reordered and unknown extension. |
| {"ES-v-00-u-000-00", "es-u-000-00-v-00", Raw}, |
| } |
| for i, tt := range tests { |
| in, _ := Raw.Parse(tt.in) |
| in, _ = tt.option.Canonicalize(in) |
| if in.String() != tt.out { |
| t.Errorf("%d:%s: was %s; want %s", i, tt.in, in.String(), tt.out) |
| } |
| } |
| // Test idempotence. |
| for _, base := range Supported.BaseLanguages() { |
| tag, _ := Raw.Compose(base) |
| got, _ := All.Canonicalize(tag) |
| want, _ := All.Canonicalize(got) |
| if got != want { |
| t.Errorf("idem(%s): got %s; want %s", tag, got, want) |
| } |
| } |
| } |
| |
| func TestTypeForKey(t *testing.T) { |
| tests := []struct{ key, in, out string }{ |
| {"co", "en", ""}, |
| {"co", "en-u-abc", ""}, |
| {"co", "en-u-co-phonebk", "phonebk"}, |
| {"co", "en-u-co-phonebk-cu-aud", "phonebk"}, |
| {"co", "x-foo-u-co-phonebk", ""}, |
| {"va", "en-US-u-va-posix", "posix"}, |
| {"rg", "en-u-rg-gbzzzz", "gbzzzz"}, |
| {"nu", "en-u-co-phonebk-nu-arabic", "arabic"}, |
| {"kc", "cmn-u-co-stroke", ""}, |
| {"rg", "cmn-u-rg", ""}, |
| {"rg", "cmn-u-rg-co-stroke", ""}, |
| {"co", "cmn-u-rg-co-stroke", "stroke"}, |
| {"co", "cmn-u-co-rg-gbzzzz", ""}, |
| {"rg", "cmn-u-co-rg-gbzzzz", "gbzzzz"}, |
| {"rg", "cmn-u-rg-gbzzzz-nlzzzz", "gbzzzz"}, |
| } |
| for _, tt := range tests { |
| if v := Make(tt.in).TypeForKey(tt.key); v != tt.out { |
| t.Errorf("%q[%q]: was %q; want %q", tt.in, tt.key, v, tt.out) |
| } |
| } |
| } |
| |
| func TestParent(t *testing.T) { |
| tests := []struct{ in, out string }{ |
| // Strip variants and extensions first |
| {"de-u-co-phonebk", "de"}, |
| {"de-1994", "de"}, |
| {"de-Latn-1994", "de"}, // remove superfluous script. |
| |
| // Ensure the canonical Tag for an entry is in the chain for base-script |
| // pairs. |
| {"zh-Hans", "zh"}, |
| |
| // Skip the script if it is the maximized version. CLDR files for the |
| // skipped tag are always empty. |
| {"zh-Hans-TW", "zh"}, |
| {"zh-Hans-CN", "zh"}, |
| |
| // Insert the script if the maximized script is not the same as the |
| // maximized script of the base language. |
| {"zh-TW", "zh-Hant"}, |
| {"zh-HK", "zh-Hant"}, |
| {"zh-Hant-TW", "zh-Hant"}, |
| {"zh-Hant-HK", "zh-Hant"}, |
| |
| // Non-default script skips to und. |
| // CLDR |
| {"az-Cyrl", "und"}, |
| {"bs-Cyrl", "und"}, |
| {"en-Dsrt", "und"}, |
| {"ha-Arab", "und"}, |
| {"mn-Mong", "und"}, |
| {"pa-Arab", "und"}, |
| {"shi-Latn", "und"}, |
| {"sr-Latn", "und"}, |
| {"uz-Arab", "und"}, |
| {"uz-Cyrl", "und"}, |
| {"vai-Latn", "und"}, |
| {"zh-Hant", "und"}, |
| // extra |
| {"nl-Cyrl", "und"}, |
| |
| // World english inherits from en-001. |
| {"en-150", "en-001"}, |
| {"en-AU", "en-001"}, |
| {"en-BE", "en-001"}, |
| {"en-GG", "en-001"}, |
| {"en-GI", "en-001"}, |
| {"en-HK", "en-001"}, |
| {"en-IE", "en-001"}, |
| {"en-IM", "en-001"}, |
| {"en-IN", "en-001"}, |
| {"en-JE", "en-001"}, |
| {"en-MT", "en-001"}, |
| {"en-NZ", "en-001"}, |
| {"en-PK", "en-001"}, |
| {"en-SG", "en-001"}, |
| |
| // Spanish in Latin-American countries have es-419 as parent. |
| {"es-AR", "es-419"}, |
| {"es-BO", "es-419"}, |
| {"es-CL", "es-419"}, |
| {"es-CO", "es-419"}, |
| {"es-CR", "es-419"}, |
| {"es-CU", "es-419"}, |
| {"es-DO", "es-419"}, |
| {"es-EC", "es-419"}, |
| {"es-GT", "es-419"}, |
| {"es-HN", "es-419"}, |
| {"es-MX", "es-419"}, |
| {"es-NI", "es-419"}, |
| {"es-PA", "es-419"}, |
| {"es-PE", "es-419"}, |
| {"es-PR", "es-419"}, |
| {"es-PY", "es-419"}, |
| {"es-SV", "es-419"}, |
| {"es-US", "es-419"}, |
| {"es-UY", "es-419"}, |
| {"es-VE", "es-419"}, |
| // exceptions (according to CLDR) |
| {"es-CW", "es"}, |
| |
| // Inherit from pt-PT, instead of pt for these countries. |
| {"pt-AO", "pt-PT"}, |
| {"pt-CV", "pt-PT"}, |
| {"pt-GW", "pt-PT"}, |
| {"pt-MO", "pt-PT"}, |
| {"pt-MZ", "pt-PT"}, |
| {"pt-ST", "pt-PT"}, |
| {"pt-TL", "pt-PT"}, |
| |
| {"en-GB-u-co-phonebk-rg-uszzzz", "en-GB"}, |
| {"en-GB-u-rg-uszzzz", "en-GB"}, |
| {"en-US-u-va-posix", "en-US"}, |
| |
| // Difference between language and regional tag. |
| {"ca-ES-valencia", "ca-ES"}, |
| {"ca-ES-valencia-u-rg-ptzzzz", "ca-ES"}, |
| {"en-US-u-va-variant", "en-US"}, |
| {"en-u-va-variant", "en"}, |
| {"en-u-rg-gbzzzz", "en"}, |
| {"en-US-u-rg-gbzzzz", "en-US"}, |
| {"nl-US-u-rg-gbzzzz", "nl-US"}, |
| } |
| for _, tt := range tests { |
| tag := Raw.MustParse(tt.in) |
| if p := Raw.MustParse(tt.out); p != tag.Parent() { |
| t.Errorf("%s: was %v; want %v", tt.in, tag.Parent(), p) |
| } |
| } |
| } |
| |
| var ( |
| // Tags without error that don't need to be changed. |
| benchBasic = []string{ |
| "en", |
| "en-Latn", |
| "en-GB", |
| "za", |
| "zh-Hant", |
| "zh", |
| "zh-HK", |
| "ar-MK", |
| "en-CA", |
| "fr-CA", |
| "fr-CH", |
| "fr", |
| "lv", |
| "he-IT", |
| "tlh", |
| "ja", |
| "ja-Jpan", |
| "ja-Jpan-JP", |
| "de-1996", |
| "de-CH", |
| "sr", |
| "sr-Latn", |
| } |
| // Tags with extensions, not changes required. |
| benchExt = []string{ |
| "x-a-b-c-d", |
| "x-aa-bbbb-cccccccc-d", |
| "en-x_cc-b-bbb-a-aaa", |
| "en-c_cc-b-bbb-a-aaa-x-x", |
| "en-u-co-phonebk", |
| "en-Cyrl-u-co-phonebk", |
| "en-US-u-co-phonebk-cu-xau", |
| "en-nedix-u-co-phonebk", |
| "en-t-t0-abcd", |
| "en-t-nl-latn", |
| "en-t-t0-abcd-x-a", |
| } |
| // Change, but not memory allocation required. |
| benchSimpleChange = []string{ |
| "EN", |
| "i-klingon", |
| "en-latn", |
| "zh-cmn-Hans-CN", |
| "iw-NL", |
| } |
| // Change and memory allocation required. |
| benchChangeAlloc = []string{ |
| "en-c_cc-b-bbb-a-aaa", |
| "en-u-cu-xua-co-phonebk", |
| "en-u-cu-xua-co-phonebk-a-cd", |
| "en-u-def-abc-cu-xua-co-phonebk", |
| "en-t-en-Cyrl-NL-1994", |
| "en-t-en-Cyrl-NL-1994-t0-abc-def", |
| } |
| // Tags that result in errors. |
| benchErr = []string{ |
| // IllFormed |
| "x_A.-B-C_D", |
| "en-u-cu-co-phonebk", |
| "en-u-cu-xau-co", |
| "en-t-nl-abcd", |
| // Invalid |
| "xx", |
| "nl-Uuuu", |
| "nl-QB", |
| } |
| benchChange = append(benchSimpleChange, benchChangeAlloc...) |
| benchAll = append(append(append(benchBasic, benchExt...), benchChange...), benchErr...) |
| ) |
| |
| func doParse(b *testing.B, tag []string) { |
| for i := 0; i < b.N; i++ { |
| // Use the modulo instead of looping over all tags so that we get a somewhat |
| // meaningful ns/op. |
| Parse(tag[i%len(tag)]) |
| } |
| } |
| |
| func BenchmarkParse(b *testing.B) { |
| doParse(b, benchAll) |
| } |
| |
| func BenchmarkParseBasic(b *testing.B) { |
| doParse(b, benchBasic) |
| } |
| |
| func BenchmarkParseError(b *testing.B) { |
| doParse(b, benchErr) |
| } |
| |
| func BenchmarkParseSimpleChange(b *testing.B) { |
| doParse(b, benchSimpleChange) |
| } |
| |
| func BenchmarkParseChangeAlloc(b *testing.B) { |
| doParse(b, benchChangeAlloc) |
| } |