math/big: optimize shlVU_g and shrVU_g

author Josh Bleecher Snyder <josharian@gmail.com>
Sun, 3 Mar 2019 21:08:40 +0000 (13:08 -0800)
committer Josh Bleecher Snyder <josharian@gmail.com>
Mon, 4 Mar 2019 19:30:57 +0000 (19:30 +0000)

diff --git a/src/math/big/arith.go b/src/math/big/arith.go
index f9db9118eb254e18a19e30a87ed0c55eca03e056..611193ef18299c5d5dffa89a61a5797e618ca2c7 100644
--- a/src/math/big/arith.go
+++ b/src/math/big/arith.go
@@ -204,32 +204,46 @@ func subVW_g(z, x []Word, y Word) (c Word) {
  }
  
  func shlVU_g(z, x []Word, s uint) (c Word) {
-       if n := len(z); n > 0 {
-               ŝ := _W - s
-               w1 := x[n-1]
-               c = w1 >> ŝ
-               for i := n - 1; i > 0; i-- {
-                       w := w1
-                       w1 = x[i-1]
-                       z[i] = w<<s | w1>>ŝ
-               }
-               z[0] = w1 << s
+       if s == 0 {
+               copy(z, x)
+               return
+       }
+       if len(z) == 0 {
+               return
+       }
+       s &= _W - 1 // hint to the compiler that shifts by s don't need guard code
+       ŝ := _W - s
+       ŝ &= _W - 1 // ditto
+       w1 := x[len(z)-1]
+       c = w1 >> ŝ
+       for i := len(z) - 1; i > 0; i-- {
+               w := w1
+               w1 = x[i-1]
+               z[i] = w<<s | w1>>ŝ
         }
+       z[0] = w1 << s
         return
  }
  
  func shrVU_g(z, x []Word, s uint) (c Word) {
-       if n := len(z); n > 0 {
-               ŝ := _W - s
-               w1 := x[0]
-               c = w1 << ŝ
-               for i := 0; i < n-1; i++ {
-                       w := w1
-                       w1 = x[i+1]
-                       z[i] = w>>s | w1<<ŝ
-               }
-               z[n-1] = w1 >> s
+       if s == 0 {
+               copy(z, x)
+               return
+       }
+       if len(z) == 0 {
+               return
+       }
+       s &= _W - 1 // hint to the compiler that shifts by s don't need guard code
+       ŝ := _W - s
+       ŝ &= _W - 1 // ditto
+       w1 := x[0]
+       c = w1 << ŝ
+       for i := 0; i < len(z)-1; i++ {
+               w := w1
+               w1 = x[i+1]
+               z[i] = w>>s | w1<<ŝ
         }
+       z[len(z)-1] = w1 >> s
         return
  }
author	Josh Bleecher Snyder <josharian@gmail.com>
	Sun, 3 Mar 2019 21:08:40 +0000 (13:08 -0800)
committer	Josh Bleecher Snyder <josharian@gmail.com>
	Mon, 4 Mar 2019 19:30:57 +0000 (19:30 +0000)