databricks
diff --git a/libs/tags/aws.go b/libs/tags/aws.go
Lines changed: 10 additions & 8 deletions
diff --git a/libs/tags/azure.go b/libs/tags/azure.go
Lines changed: 7 additions & 5 deletions
diff --git a/libs/tags/gcp.go b/libs/tags/gcp.go
Lines changed: 12 additions & 10 deletions
diff --git a/libs/tags/latin_test.go b/libs/tags/latin_test.go
Lines changed: 0 additions & 16 deletions
diff --git a/libs/tags/tag.go b/libs/tags/tag.go
Lines changed: 8 additions & 6 deletions
diff --git a/libs/tags/transform.go b/libs/tags/transform.go
Lines changed: 0 additions & 87 deletions
diff --git a/libs/tags/transform_test.go b/libs/tags/transform_test.go
Lines changed: 0 additions & 25 deletions
diff --git a/libs/tags/latin.go b/libs/textutil/latin.go
libs/tags/latin.go renamed to libs/textutil/latin.go
Lines changed: 2 additions & 2 deletions
diff --git a/libs/textutil/latin_test.go b/libs/textutil/latin_test.go
Lines changed: 16 additions & 0 deletions
@@ -4,6 +4,8 @@ import (
 	"regexp"
 	"unicode"
 
+	"github.com/databricks/cli/libs/textutil"
+
 	"golang.org/x/text/unicode/rangetable"
 )
 
@@ -20,17 +22,17 @@ var awsChars = rangetable.Merge(
 var awsTag = &tag{
 	keyLength:  127,
 	keyPattern: regexp.MustCompile(`^[\d \w\+\-=\.:\/@]*$`),
-	keyNormalize: chain(
-		normalizeMarks(),
-		replaceNotIn(latin1, '_'),
-		replaceNotIn(awsChars, '_'),
+	keyNormalize: textutil.Chain(
+		textutil.NormalizeMarks(),
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
+		textutil.ReplaceNotIn(awsChars, '_'),
 	),
 
 	valueLength:  255,
 	valuePattern: regexp.MustCompile(`^[\d \w\+\-=\.:/@]*$`),
-	valueNormalize: chain(
-		normalizeMarks(),
-		replaceNotIn(latin1, '_'),
-		replaceNotIn(awsChars, '_'),
+	valueNormalize: textutil.Chain(
+		textutil.NormalizeMarks(),
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
+		textutil.ReplaceNotIn(awsChars, '_'),
 	),
 }
@@ -3,6 +3,8 @@ package tags
 import (
 	"regexp"
 
+	"github.com/databricks/cli/libs/textutil"
+
 	"golang.org/x/text/unicode/rangetable"
 )
 
@@ -12,14 +14,14 @@ var azureForbiddenChars = rangetable.New('<', '>', '*', '&', '%', ';', '\\', '/'
 var azureTag = &tag{
 	keyLength:  512,
 	keyPattern: regexp.MustCompile(`^[^<>\*&%;\\\/\+\?]*$`),
-	keyNormalize: chain(
-		replaceNotIn(latin1, '_'),
-		replaceIn(azureForbiddenChars, '_'),
+	keyNormalize: textutil.Chain(
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
+		textutil.ReplaceIn(azureForbiddenChars, '_'),
 	),
 
 	valueLength:  256,
 	valuePattern: regexp.MustCompile(`^.*$`),
-	valueNormalize: chain(
-		replaceNotIn(latin1, '_'),
+	valueNormalize: textutil.Chain(
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
 	),
 }
@@ -3,6 +3,8 @@ package tags
 import (
 	"regexp"
 	"unicode"
+
+	"github.com/databricks/cli/libs/textutil"
 )
 
 // Tag keys and values on GCP are limited to 63 characters and must match the
@@ -45,19 +47,19 @@ var gcpInner = &unicode.RangeTable{
 var gcpTag = &tag{
 	keyLength:  63,
 	keyPattern: regexp.MustCompile(`^([A-Za-z0-9][-A-Za-z0-9_.]*)?[A-Za-z0-9]$`),
-	keyNormalize: chain(
-		normalizeMarks(),
-		replaceNotIn(latin1, '_'),
-		replaceNotIn(gcpInner, '_'),
-		trimIfNotIn(gcpOuter),
+	keyNormalize: textutil.Chain(
+		textutil.NormalizeMarks(),
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
+		textutil.ReplaceNotIn(gcpInner, '_'),
+		textutil.TrimIfNotIn(gcpOuter),
 	),
 
 	valueLength:  63,
 	valuePattern: regexp.MustCompile(`^(([A-Za-z0-9][-A-Za-z0-9_.]*)?[A-Za-z0-9])?$`),
-	valueNormalize: chain(
-		normalizeMarks(),
-		replaceNotIn(latin1, '_'),
-		replaceNotIn(gcpInner, '_'),
-		trimIfNotIn(gcpOuter),
+	valueNormalize: textutil.Chain(
+		textutil.NormalizeMarks(),
+		textutil.ReplaceNotIn(textutil.Latin1, '_'),
+		textutil.ReplaceNotIn(gcpInner, '_'),
+		textutil.TrimIfNotIn(gcpOuter),
 	),
 }
@@ -6,18 +6,20 @@ import (
 	"regexp"
 	"strings"
 	"unicode"
+
+	"github.com/databricks/cli/libs/textutil"
 )
 
 // The tag type holds the validation and normalization rules for
 // a cloud provider's resource tags as applied by Databricks.
 type tag struct {
 	keyLength    int
 	keyPattern   *regexp.Regexp
-	keyNormalize transformer
+	keyNormalize textutil.Transformer
 
 	valueLength    int
 	valuePattern   *regexp.Regexp
-	valueNormalize transformer
+	valueNormalize textutil.Transformer
 }
 
 func (t *tag) ValidateKey(s string) error {
@@ -27,7 +29,7 @@ func (t *tag) ValidateKey(s string) error {
 	if len(s) > t.keyLength {
 		return fmt.Errorf("key length %d exceeds maximum of %d", len(s), t.keyLength)
 	}
-	if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(latin1, r) }) {
+	if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(textutil.Latin1, r) }) {
 		return errors.New("key contains non-latin1 characters")
 	}
 	if !t.keyPattern.MatchString(s) {
@@ -40,7 +42,7 @@ func (t *tag) ValidateValue(s string) error {
 	if len(s) > t.valueLength {
 		return fmt.Errorf("value length %d exceeds maximum of %d", len(s), t.valueLength)
 	}
-	if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(latin1, r) }) {
+	if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(textutil.Latin1, r) }) {
 		return errors.New("value contains non-latin1 characters")
 	}
 	if !t.valuePattern.MatchString(s) {
@@ -50,9 +52,9 @@ func (t *tag) ValidateValue(s string) error {
 }
 
 func (t *tag) NormalizeKey(s string) string {
-	return t.keyNormalize.transform(s)
+	return t.keyNormalize.TransformString(s)
 }
 
 func (t *tag) NormalizeValue(s string) string {
-	return t.valueNormalize.transform(s)
+	return t.valueNormalize.TransformString(s)
 }
@@ -1,9 +1,9 @@
-package tags
+package textutil
 
 import "unicode"
 
 // Range table for all characters in the Latin1 character set.
-var latin1 = &unicode.RangeTable{
+var Latin1 = &unicode.RangeTable{
 	R16: []unicode.Range16{
 		{0x0000, 0x00ff, 1},
 	},
 
@@ -0,0 +1,16 @@
+package textutil
+
+import (
+	"testing"
+	"unicode"
+
+	"github.com/stretchr/testify/assert"
+)
+
+func TestLatinTable(t *testing.T) {
+	assert.True(t, unicode.In('\u0000', Latin1))
+	assert.True(t, unicode.In('A', Latin1))
+	assert.True(t, unicode.In('Z', Latin1))
+	assert.True(t, unicode.In('\u00ff', Latin1))
+	assert.False(t, unicode.In('\u0100', Latin1))
+}
Original file line number	Diff line number	Diff line change
`@@ -6,18 +6,20 @@ import (`
`6`	`6`	`"regexp"`
`7`	`7`	`"strings"`
`8`	`8`	`"unicode"`
	`9`	`+`
	`10`	`+ "github.com/databricks/cli/libs/textutil"`
`9`	`11`	`)`
`10`	`12`
`11`	`13`	`// The tag type holds the validation and normalization rules for`
`12`	`14`	`// a cloud provider's resource tags as applied by Databricks.`
`13`	`15`	`type tag struct {`
`14`	`16`	`keyLength int`
`15`	`17`	`keyPattern *regexp.Regexp`
`16`		`- keyNormalize transformer`
	`18`	`+ keyNormalize textutil.Transformer`
`17`	`19`
`18`	`20`	`valueLength int`
`19`	`21`	`valuePattern *regexp.Regexp`
`20`		`- valueNormalize transformer`
	`22`	`+ valueNormalize textutil.Transformer`
`21`	`23`	`}`
`22`	`24`
`23`	`25`	`func (t *tag) ValidateKey(s string) error {`
`@@ -27,7 +29,7 @@ func (t *tag) ValidateKey(s string) error {`
`27`	`29`	`if len(s) > t.keyLength {`
`28`	`30`	`return fmt.Errorf("key length %d exceeds maximum of %d", len(s), t.keyLength)`
`29`	`31`	`}`
`30`		`- if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(latin1, r) }) {`
	`32`	`+ if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(textutil.Latin1, r) }) {`
`31`	`33`	`return errors.New("key contains non-latin1 characters")`
`32`	`34`	`}`
`33`	`35`	`if !t.keyPattern.MatchString(s) {`
`@@ -40,7 +42,7 @@ func (t *tag) ValidateValue(s string) error {`
`40`	`42`	`if len(s) > t.valueLength {`
`41`	`43`	`return fmt.Errorf("value length %d exceeds maximum of %d", len(s), t.valueLength)`
`42`	`44`	`}`
`43`		`- if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(latin1, r) }) {`
	`45`	`+ if strings.ContainsFunc(s, func(r rune) bool { return !unicode.Is(textutil.Latin1, r) }) {`
`44`	`46`	`return errors.New("value contains non-latin1 characters")`
`45`	`47`	`}`
`46`	`48`	`if !t.valuePattern.MatchString(s) {`
`@@ -50,9 +52,9 @@ func (t *tag) ValidateValue(s string) error {`
`50`	`52`	`}`
`51`	`53`
`52`	`54`	`func (t *tag) NormalizeKey(s string) string {`
`53`		`- return t.keyNormalize.transform(s)`
	`55`	`+ return t.keyNormalize.TransformString(s)`
`54`	`56`	`}`
`55`	`57`
`56`	`58`	`func (t *tag) NormalizeValue(s string) string {`
`57`		`- return t.valueNormalize.transform(s)`
	`59`	`+ return t.valueNormalize.TransformString(s)`
`58`	`60`	`}`