bytes, strings: speed up TrimSpace

author Julien Cretel <jub0bsinthecloud@gmail.com>

Mon, 25 Aug 2025 20:38:20 +0000 (20:38 +0000)

committer Gopher Robot <gobot@golang.org>

Fri, 29 Aug 2025 16:34:38 +0000 (09:34 -0700)
author Julien Cretel <jub0bsinthecloud@gmail.com>
Mon, 25 Aug 2025 20:38:20 +0000 (20:38 +0000)
committer Gopher Robot <gobot@golang.org>
Fri, 29 Aug 2025 16:34:38 +0000 (09:34 -0700)
diff --git a/src/bytes/bytes.go b/src/bytes/bytes.go

index a0a8fa0b2986e1e3e937de239a0da216352b9627..ce2e004910223440bfc7f60bfe2e8bca86000e80 100644 (file)
--- a/src/bytes/bytes.go
+++ b/src/bytes/bytes.go
@@ -1117,41 +1117,34 @@ func trimRightUnicode(s []byte, cutset string) []byte {
  // TrimSpace returns a subslice of s by slicing off all leading and
  // trailing white space, as defined by Unicode.
  func TrimSpace(s []byte) []byte {
-       // Fast path for ASCII: look for the first ASCII non-space byte
-       start := 0
-       for ; start < len(s); start++ {
-               c := s[start]
+       // Fast path for ASCII: look for the first ASCII non-space byte.
+       for lo, c := range s {
                 if c >= utf8.RuneSelf {
                         // If we run into a non-ASCII byte, fall back to the
-                       // slower unicode-aware method on the remaining bytes
-                       return TrimFunc(s[start:], unicode.IsSpace)
-               }
-               if asciiSpace[c] == 0 {
-                       break
+                       // slower unicode-aware method on the remaining bytes.
+                       return TrimFunc(s[lo:], unicode.IsSpace)
                 }
-       }
-
-       // Now look for the first ASCII non-space byte from the end
-       stop := len(s)
-       for ; stop > start; stop-- {
-               c := s[stop-1]
-               if c >= utf8.RuneSelf {
-                       return TrimFunc(s[start:stop], unicode.IsSpace)
+               if asciiSpace[c] != 0 {
+                       continue
                 }
-               if asciiSpace[c] == 0 {
-                       break
+               s = s[lo:]
+               // Now look for the first ASCII non-space byte from the end.
+               for hi := len(s) - 1; hi >= 0; hi-- {
+                       c := s[hi]
+                       if c >= utf8.RuneSelf {
+                               return TrimFunc(s[:hi+1], unicode.IsSpace)
+                       }
+                       if asciiSpace[c] == 0 {
+                               // At this point, s[:hi+1] starts and ends with ASCII
+                               // non-space bytes, so we're done. Non-ASCII cases have
+                               // already been handled above.
+                               return s[:hi+1]
+                       }
                 }
         }
-
-       // At this point s[start:stop] starts and ends with an ASCII
-       // non-space bytes, so we're done. Non-ASCII cases have already
-       // been handled above.
-       if start == stop {
-               // Special case to preserve previous TrimLeftFunc behavior,
-               // returning nil instead of empty slice if all spaces.
-               return nil
-       }
-       return s[start:stop]
+       // Special case to preserve previous TrimLeftFunc behavior,
+       // returning nil instead of empty slice if all spaces.
+       return nil
  }
  
  // Runes interprets s as a sequence of UTF-8-encoded code points.
diff --git a/src/strings/strings.go b/src/strings/strings.go

index 91c6ddef669f3089a9602b77b83faed4579b0fa3..74007977d911f0382e559f7b68bb119819364066 100644 (file)
--- a/src/strings/strings.go
+++ b/src/strings/strings.go
@@ -1091,37 +1091,32 @@ func trimRightUnicode(s, cutset string) string {
  // TrimSpace returns a slice of the string s, with all leading
  // and trailing white space removed, as defined by Unicode.
  func TrimSpace(s string) string {
-       // Fast path for ASCII: look for the first ASCII non-space byte
-       start := 0
-       for ; start < len(s); start++ {
-               c := s[start]
+       // Fast path for ASCII: look for the first ASCII non-space byte.
+       for lo, c := range []byte(s) {
                 if c >= utf8.RuneSelf {
                         // If we run into a non-ASCII byte, fall back to the
-                       // slower unicode-aware method on the remaining bytes
-                       return TrimFunc(s[start:], unicode.IsSpace)
-               }
-               if asciiSpace[c] == 0 {
-                       break
+                       // slower unicode-aware method on the remaining bytes.
+                       return TrimFunc(s[lo:], unicode.IsSpace)
                 }
-       }
-
-       // Now look for the first ASCII non-space byte from the end
-       stop := len(s)
-       for ; stop > start; stop-- {
-               c := s[stop-1]
-               if c >= utf8.RuneSelf {
-                       // start has been already trimmed above, should trim end only
-                       return TrimRightFunc(s[start:stop], unicode.IsSpace)
+               if asciiSpace[c] != 0 {
+                       continue
                 }
-               if asciiSpace[c] == 0 {
-                       break
+               s = s[lo:]
+               // Now look for the first ASCII non-space byte from the end.
+               for hi := len(s) - 1; hi >= 0; hi-- {
+                       c := s[hi]
+                       if c >= utf8.RuneSelf {
+                               return TrimRightFunc(s[:hi+1], unicode.IsSpace)
+                       }
+                       if asciiSpace[c] == 0 {
+                               // At this point, s[:hi+1] starts and ends with ASCII
+                               // non-space bytes, so we're done. Non-ASCII cases have
+                               // already been handled above.
+                               return s[:hi+1]
+                       }
                 }
         }
-
-       // At this point s[start:stop] starts and ends with an ASCII
-       // non-space bytes, so we're done. Non-ASCII cases have already
-       // been handled above.
-       return s[start:stop]
+       return ""
  }
  
  // TrimPrefix returns s without the provided leading prefix string.
author	Julien Cretel <jub0bsinthecloud@gmail.com>
	Mon, 25 Aug 2025 20:38:20 +0000 (20:38 +0000)
committer	Gopher Robot <gobot@golang.org>
	Fri, 29 Aug 2025 16:34:38 +0000 (09:34 -0700)
src/bytes/bytes.go		patch | blob | history
src/strings/strings.go		patch | blob | history