mirror of
https://github.com/golang/go.git
synced 2025-11-11 22:21:06 +00:00
utf8.String: Slice(i,j)
R=rsc CC=golang-dev https://golang.org/cl/2225048
This commit is contained in:
parent
b1f44a120f
commit
2f80d328e8
2 changed files with 76 additions and 1 deletions
|
|
@ -11,6 +11,8 @@ package utf8
|
||||||
// O(N) in the length of the string, but the overhead is less than always
|
// O(N) in the length of the string, but the overhead is less than always
|
||||||
// scanning from the beginning.
|
// scanning from the beginning.
|
||||||
// If the string is ASCII, random access is O(1).
|
// If the string is ASCII, random access is O(1).
|
||||||
|
// Unlike the built-in string type, String has internal mutable state and
|
||||||
|
// is not thread-safe.
|
||||||
type String struct {
|
type String struct {
|
||||||
str string
|
str string
|
||||||
numRunes int
|
numRunes int
|
||||||
|
|
@ -55,6 +57,39 @@ func (s *String) IsASCII() bool {
|
||||||
return s.width == 0
|
return s.width == 0
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Slice returns the string sliced at rune positions [i:j].
|
||||||
|
func (s *String) Slice(i, j int) string {
|
||||||
|
// ASCII is easy. Let the compiler catch the indexing error if there is one.
|
||||||
|
if j < s.nonASCII {
|
||||||
|
return s.str[i:j]
|
||||||
|
}
|
||||||
|
if i < 0 || j > s.numRunes || i > j {
|
||||||
|
panic(sliceOutOfRange)
|
||||||
|
}
|
||||||
|
if i == j {
|
||||||
|
return ""
|
||||||
|
}
|
||||||
|
// For non-ASCII, after At(i), bytePos is always the position of the indexed character.
|
||||||
|
var low, high int
|
||||||
|
switch {
|
||||||
|
case i < s.nonASCII:
|
||||||
|
low = i
|
||||||
|
case i == s.numRunes:
|
||||||
|
low = len(s.str)
|
||||||
|
default:
|
||||||
|
s.At(i)
|
||||||
|
low = s.bytePos
|
||||||
|
}
|
||||||
|
switch {
|
||||||
|
case j == s.numRunes:
|
||||||
|
high = len(s.str)
|
||||||
|
default:
|
||||||
|
s.At(j)
|
||||||
|
high = s.bytePos
|
||||||
|
}
|
||||||
|
return s.str[low:high]
|
||||||
|
}
|
||||||
|
|
||||||
// At returns the rune with index i in the String. The sequence of runes is the same
|
// At returns the rune with index i in the String. The sequence of runes is the same
|
||||||
// as iterating over the contents with a "for range" clause.
|
// as iterating over the contents with a "for range" clause.
|
||||||
func (s *String) At(i int) int {
|
func (s *String) At(i int) int {
|
||||||
|
|
@ -163,4 +198,5 @@ func (err error) String() string {
|
||||||
func (err error) RunTimeError() {
|
func (err error) RunTimeError() {
|
||||||
}
|
}
|
||||||
|
|
||||||
var outOfRange = error("utf8.String: index out of Range")
|
var outOfRange = error("utf8.String: index out of range")
|
||||||
|
var sliceOutOfRange = error("utf8.String: slice index out of range")
|
||||||
|
|
|
||||||
|
|
@ -68,3 +68,42 @@ func TestRandomAccess(t *testing.T) {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestRandomSliceAccess(t *testing.T) {
|
||||||
|
for _, s := range testStrings {
|
||||||
|
if len(s) == 0 || s[0] == '\x80' { // the bad-UTF-8 string fools this simple test
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
runes := []int(s)
|
||||||
|
str := NewString(s)
|
||||||
|
if str.RuneCount() != len(runes) {
|
||||||
|
t.Error("%s: expected %d runes; got %d", s, len(runes), str.RuneCount())
|
||||||
|
break
|
||||||
|
}
|
||||||
|
for k := 0; k < randCount; k++ {
|
||||||
|
i := rand.Intn(len(runes))
|
||||||
|
j := rand.Intn(len(runes) + 1)
|
||||||
|
if i > j { // include empty strings
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
expect := string(runes[i:j])
|
||||||
|
got := str.Slice(i, j)
|
||||||
|
if got != expect {
|
||||||
|
t.Errorf("%s[%d:%d]: expected %q got %q", s, i, j, expect, got)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestLimitSliceAccess(t *testing.T) {
|
||||||
|
for _, s := range testStrings {
|
||||||
|
str := NewString(s)
|
||||||
|
if str.Slice(0, 0) != "" {
|
||||||
|
t.Error("failure with empty slice at beginning")
|
||||||
|
}
|
||||||
|
nr := RuneCountInString(s)
|
||||||
|
if str.Slice(nr, nr) != "" {
|
||||||
|
t.Error("failure with empty slice at end")
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue