runtime: fix alignment code in memmove_riscv64.s

author Mark Ryan <markdryan@rivosinc.com>

Fri, 26 May 2023 08:51:21 +0000 (10:51 +0200)

committer Keith Randall <khr@golang.org>

Wed, 31 May 2023 19:56:05 +0000 (19:56 +0000)
author Mark Ryan <markdryan@rivosinc.com>
Fri, 26 May 2023 08:51:21 +0000 (10:51 +0200)
committer Keith Randall <khr@golang.org>
Wed, 31 May 2023 19:56:05 +0000 (19:56 +0000)
diff --git a/src/runtime/memmove_riscv64.s b/src/runtime/memmove_riscv64.s

index ea622ed951befe2b00d85d950ae12e0481e70a68..f5db86562b449cd73265cb5593bf9ba586e22f1e 100644 (file)
--- a/src/runtime/memmove_riscv64.s
+++ b/src/runtime/memmove_riscv64.s
@@ -23,12 +23,13 @@ TEXT runtime·memmove<ABIInternal>(SB),NOSPLIT,$-0-24
         BLT     X12, X9, f_loop4_check
  
         // Check alignment - if alignment differs we have to do one byte at a time.
-       AND     $3, X10, X5
-       AND     $3, X11, X6
+       AND     $7, X10, X5
+       AND     $7, X11, X6
         BNE     X5, X6, f_loop8_unaligned_check
         BEQZ    X5, f_loop_check
  
         // Move one byte at a time until we reach 8 byte alignment.
+       SUB     X5, X9, X5
         SUB     X5, X12, X12
  f_align:
         ADD     $-1, X5
@@ -173,8 +174,8 @@ backward:
         BLT     X12, X9, b_loop4_check
  
         // Check alignment - if alignment differs we have to do one byte at a time.
-       AND     $3, X10, X5
-       AND     $3, X11, X6
+       AND     $7, X10, X5
+       AND     $7, X11, X6
         BNE     X5, X6, b_loop8_unaligned_check
         BEQZ    X5, b_loop_check
  
diff --git a/src/runtime/memmove_test.go b/src/runtime/memmove_test.go

index f0c9a82bb629767d38792641349cf97e8f137c33..21236d19da56d064fab21d123dca086cff112c3b 100644 (file)
--- a/src/runtime/memmove_test.go
+++ b/src/runtime/memmove_test.go
@@ -338,6 +338,29 @@ func BenchmarkMemmoveUnalignedSrc(b *testing.B) {
         })
  }
  
+func BenchmarkMemmoveUnalignedSrcDst(b *testing.B) {
+       for _, n := range []int{16, 64, 256, 4096, 65536} {
+               buf := make([]byte, (n+8)*2)
+               x := buf[:len(buf)/2]
+               y := buf[len(buf)/2:]
+               for _, off := range []int{0, 1, 4, 7} {
+                       b.Run(fmt.Sprint("f_", n, off), func(b *testing.B) {
+                               b.SetBytes(int64(n))
+                               for i := 0; i < b.N; i++ {
+                                       copy(x[off:n+off], y[off:n+off])
+                               }
+                       })
+
+                       b.Run(fmt.Sprint("b_", n, off), func(b *testing.B) {
+                               b.SetBytes(int64(n))
+                               for i := 0; i < b.N; i++ {
+                                       copy(y[off:n+off], x[off:n+off])
+                               }
+                       })
+               }
+       }
+}
+
  func BenchmarkMemmoveUnalignedSrcOverlap(b *testing.B) {
         benchmarkSizes(b, bufSizesOverlap, func(b *testing.B, n int) {
                 x := make([]byte, n+1)
author	Mark Ryan <markdryan@rivosinc.com>
	Fri, 26 May 2023 08:51:21 +0000 (10:51 +0200)
committer	Keith Randall <khr@golang.org>
	Wed, 31 May 2023 19:56:05 +0000 (19:56 +0000)
src/runtime/memmove_riscv64.s		patch | blob | history
src/runtime/memmove_test.go		patch | blob | history