aboutsummaryrefslogtreecommitdiff
path: root/src/internal/bytealg/equal_riscv64.s
blob: 5dd13beb5552de196fed663f4a361c7b7af2e86a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
// Copyright 2019 The Go Authors. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file.

#include "go_asm.h"
#include "textflag.h"

// CTXT names register S10. In this file memequal_varlen loads the
// comparison size from 8(CTXT), i.e. from offset 8 of its closure.
#define	CTXT	S10

// func memequal(a, b unsafe.Pointer, size uintptr) bool
//
// Stack-argument entry point. It places the operands in the registers
// that memequal<> expects (X5/X6 = pointers, X7 = length, X19 = address
// of the result byte) and jumps there; memequal<> stores the result and
// returns to our caller.
TEXT runtime·memequal(SB),NOSPLIT|NOFRAME,$0-25
	MOV	$ret+24(FP), X19	// X19 = &ret
	MOV	size+16(FP), X7		// X7 = number of bytes to compare
	MOV	b+8(FP), X6		// X6 = second region
	MOV	a+0(FP), X5		// X5 = first region
	JMP	memequal<>(SB)

// func memequal_varlen(a, b unsafe.Pointer) bool
//
// Same as memequal, except that the length is not an argument: it is
// read from the closure addressed by CTXT. The operands are placed in
// the registers memequal<> expects before jumping to it.
TEXT runtime·memequal_varlen(SB),NOSPLIT|NOFRAME,$0-17
	MOV	$ret+16(FP), X19	// X19 = &ret
	MOV	8(CTXT), X7		// X7 = size; the compiler stores it at offset 8 in the closure
	MOV	b+8(FP), X6		// X6 = second region
	MOV	a+0(FP), X5		// X5 = first region
	JMP	memequal<>(SB)

// memequal<> reports whether two memory regions hold identical bytes.
//
// On entry:
//	X5  = pointer to the first region
//	X6  = pointer to the second region
//	X7  = length in bytes
//	X19 = address at which the one-byte result is stored
//
// On return the byte at (X19) is 1 if the regions are equal and 0 if
// they differ. X5-X17 are used as scratch.
TEXT memequal<>(SB),NOSPLIT|NOFRAME,$0
	// Identical pointers always compare equal, whatever the length.
	BEQ	X5, X6, eq

	// Short inputs are not worth aligning; compare them bytewise.
	MOV	$32, X8
	BLT	X7, X8, loop4_check

	// Check alignment - the 32 and 16 byte loops below use 8 byte loads,
	// so both pointers must share the same offset within an 8 byte word.
	// If the offsets differ we have to do one byte at a time.
	AND	$7, X5, X9
	AND	$7, X6, X10
	BNE	X9, X10, loop4_check
	BEQZ	X9, loop32_check

	// Check one byte at a time until we reach 8 byte alignment.
	// X9 holds the offset past the previous 8 byte boundary (1..7), so
	// the number of bytes up to the next boundary is 8 - X9. The length
	// is at least 32 here, so it cannot go negative.
	SUB	X9, X0, X9
	ADD	$8, X9, X9
	SUB	X9, X7, X7
align:
	ADD	$-1, X9
	MOVBU	0(X5), X10
	MOVBU	0(X6), X11
	BNE	X10, X11, not_eq
	ADD	$1, X5
	ADD	$1, X6
	BNEZ	X9, align

	// Compare 32 bytes per iteration using four 8 byte loads per side.
loop32_check:
	MOV	$32, X9
	BLT	X7, X9, loop16_check
loop32:
	MOV	0(X5), X10
	MOV	0(X6), X11
	MOV	8(X5), X12
	MOV	8(X6), X13
	BNE	X10, X11, not_eq
	BNE	X12, X13, not_eq
	MOV	16(X5), X14
	MOV	16(X6), X15
	MOV	24(X5), X16
	MOV	24(X6), X17
	BNE	X14, X15, not_eq
	BNE	X16, X17, not_eq
	ADD	$32, X5
	ADD	$32, X6
	ADD	$-32, X7
	BGE	X7, X9, loop32
	BEQZ	X7, eq

	// Compare 16 bytes per iteration using two 8 byte loads per side.
loop16_check:
	MOV	$16, X8
	BLT	X7, X8, loop4_check
loop16:
	MOV	0(X5), X10
	MOV	0(X6), X11
	MOV	8(X5), X12
	MOV	8(X6), X13
	BNE	X10, X11, not_eq
	BNE	X12, X13, not_eq
	ADD	$16, X5
	ADD	$16, X6
	ADD	$-16, X7
	BGE	X7, X8, loop16
	BEQZ	X7, eq

	// Compare 4 bytes per iteration using byte loads, which have no
	// alignment requirement. This path also handles short inputs and
	// pointers whose alignment differs.
loop4_check:
	MOV	$4, X8
	BLT	X7, X8, loop1
loop4:
	MOVBU	0(X5), X10
	MOVBU	0(X6), X11
	MOVBU	1(X5), X12
	MOVBU	1(X6), X13
	BNE	X10, X11, not_eq
	BNE	X12, X13, not_eq
	MOVBU	2(X5), X14
	MOVBU	2(X6), X15
	MOVBU	3(X5), X16
	MOVBU	3(X6), X17
	BNE	X14, X15, not_eq
	BNE	X16, X17, not_eq
	ADD	$4, X5
	ADD	$4, X6
	ADD	$-4, X7
	BGE	X7, X8, loop4

	// Compare the remaining bytes one at a time; a zero remainder
	// means everything matched.
loop1:
	BEQZ	X7, eq
	MOVBU	0(X5), X10
	MOVBU	0(X6), X11
	BNE	X10, X11, not_eq
	ADD	$1, X5
	ADD	$1, X6
	ADD	$-1, X7
	JMP	loop1

not_eq:
	// Store false in the result byte.
	MOV	$0, X5
	MOVB	X5, (X19)
	RET
eq:
	// Store true in the result byte.
	MOV	$1, X5
	MOVB	X5, (X19)
	RET