For memmove/memclr, using jump tables only reduces overall
function performance on both amd64 and 386.
Benchmarks for 32-bit memclr:
name            old time/op  new time/op  delta
Memclr/5-8      8.01ns ± 0%  8.94ns ± 2%  +11.59%  (p=0.000 n=9+9)
Memclr/16-8     9.05ns ± 0%  9.49ns ± 0%   +4.81%  (p=0.000 n=8+8)
Memclr/64-8     9.15ns ± 0%  9.49ns ± 0%   +3.76%  (p=0.000 n=9+10)
Memclr/256-8    16.6ns ± 0%  16.6ns ± 0%     ~     (p=1.140 n=10+9)
Memclr/4096-8    179ns ± 0%   166ns ± 0%   -7.26%  (p=0.000 n=9+8)
Memclr/65536-8  3.36µs ± 1%  3.31µs ± 1%   -1.48%  (p=0.000 n=10+9)
Memclr/1M-8     59.5µs ± 3%  60.5µs ± 2%   +1.67%  (p=0.009 n=10+10)
Memclr/4M-8      239µs ± 3%   245µs ± 0%   +2.49%  (p=0.004 n=10+8)
Memclr/8M-8      618µs ± 2%   614µs ± 1%     ~     (p=0.315 n=10+8)
Memclr/16M-8    1.49ms ± 2%  1.47ms ± 1%   -1.11%  (p=0.029 n=10+10)
Memclr/64M-8    7.06ms ± 1%  7.05ms ± 0%     ~     (p=0.573 n=10+8)
[Geo mean]      3.36µs       3.39µs        +1.14%
For less predictable data, such as sizes that depend on the loop
iteration, the branch table version is still 2-5% slower. It also
makes the code slightly more complicated.
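To make "loop iteration dependent sizes" concrete, a hypothetical
benchmark in that spirit might look like the sketch below (names and
sizes are illustrative; this is not the exact benchmark behind the
2-5% figure):

package memmove_test

import "testing"

// Hypothetical benchmark: the copy length changes every iteration,
// so no single size-dispatch target stays hot in the branch predictor.
func BenchmarkMemmoveUnpredictableSizes(b *testing.B) {
	src := make([]byte, 256)
	dst := make([]byte, 256)
	for i := 0; i < b.N; i++ {
		n := 1 + i%len(src)    // size depends on the loop iteration
		copy(dst[:n], src[:n]) // byte-slice copy goes through runtime memmove
	}
}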
This CL removes the TODO notes that directly suggest trying this
optimization out; they encourage people to spend their time on a
rather hopeless endeavour.
The branch table implementation used a 32/64-entry table holding
pointers to TEXT blocks that perform the work of each associated
label. Most of the last entries point to the "loop" code, the
fallthrough for all sizes that do not map onto a specialized routine.
The only extra inefficiency is the additional MOVL/MOVQ needed to
load the table pointer itself, since MOVL $sym<>(SB)(AX*4) is not
valid in Go asm (it works in other assemblers):
TEXT ·memclrNew(SB), NOSPLIT, $0-8
	MOVL	ptr+0(FP), DI
	MOVL	n+4(FP), BX
	// Handle 0 separately.
	TESTL	BX, BX
	JEQ	_0
	LEAL	-1(BX), CX	// n-1
	BSRL	CX, CX		// CX = index of the highest set bit of n-1 (the size class)
	// AX or X0 zeroed inside every text block.
	MOVL	$memclrTable<>(SB), AX
	JMP	(AX)(CX*4)	// indirect jump through the table entry for this size class
_0:
	RET
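
For readers unfamiliar with the trick: the table index is simply the
position of the highest set bit of n-1, which BSR computes in a single
instruction. A minimal Go sketch of that size-class mapping
(illustrative only, not part of this CL):

package main

import (
	"fmt"
	"math/bits"
)

// sizeClass returns the branch-table index that the assembly above
// computes with BSR: the bit index of the highest set bit of n-1.
// Valid for n >= 2; n == 0 is dispatched separately, as in the assembly.
func sizeClass(n uint32) int {
	return bits.Len32(n-1) - 1
}

func main() {
	for _, n := range []uint32{2, 3, 4, 5, 8, 9, 16, 17, 256, 257} {
		fmt.Printf("n=%4d -> table entry %d\n", n, sizeClass(n))
	}
}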
Change-Id: I4f706931b8127f85a8439b95834d5c2485a5d1bf
Reviewed-on: https://go-review.googlesource.com/115678
Run-TryBot: Iskander Sharipov <iskander.sharipov@intel.com>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: Brad Fitzpatrick <bradfitz@golang.org>
Reviewed-by: Keith Randall <khr@golang.org>
// MOVOU seems always faster than REP STOSL.
tail:
+ // BSR+branch table make almost all memmove/memclr benchmarks worse. Not worth doing.
TESTL BX, BX
JEQ _0
CMPL BX, $2
JBE _65through128
CMPL BX, $256
JBE _129through256
- // TODO: use branch table and BSR to make this just a single dispatch
loop:
MOVOU X0, 0(DI)
// MOVOU seems always faster than REP STOSQ.
tail:
+ // BSR+branch table make almost all memmove/memclr benchmarks worse. Not worth doing.
TESTQ BX, BX
JEQ _0
CMPQ BX, $2
JBE _129through256
CMPB internal∕cpu·X86+const_offsetX86HasAVX2(SB), $1
JE loop_preheader_avx2
- // TODO: use branch table and BSR to make this just a single dispatch
// TODO: for really big clears, use MOVNTDQ, even without AVX2.
loop:
// 128 because that is the maximum SSE register load (loading all data
// into registers lets us ignore copy direction).
tail:
+ // BSR+branch table make almost all memmove/memclr benchmarks worse. Not worth doing.
TESTL BX, BX
JEQ move_0
CMPL BX, $2
JBE move_33through64
CMPL BX, $128
JBE move_65through128
- // TODO: use branch table and BSR to make this just a single dispatch
nosse2:
/*
// registers before writing it back. move_256through2048 on the other
// hand can be used only when the memory regions don't overlap or the copy
// direction is forward.
+ //
+ // BSR+branch table make almost all memmove/memclr benchmarks worse. Not worth doing.
TESTQ BX, BX
JEQ move_0
CMPQ BX, $2
JBE move_65through128
CMPQ BX, $256
JBE move_129through256
- // TODO: use branch table and BSR to make this just a single dispatch
TESTB $1, runtime·useAVXmemmove(SB)
JNZ avxUnaligned