aboutsummaryrefslogtreecommitdiff
path: root/benchmarks/vec-strcmp/vec-strcmp.S
diff options
context:
space:
mode:
Diffstat (limited to 'benchmarks/vec-strcmp/vec-strcmp.S')
-rw-r--r--benchmarks/vec-strcmp/vec-strcmp.S32
1 files changed, 32 insertions, 0 deletions
diff --git a/benchmarks/vec-strcmp/vec-strcmp.S b/benchmarks/vec-strcmp/vec-strcmp.S
new file mode 100644
index 0000000..ff04333
--- /dev/null
+++ b/benchmarks/vec-strcmp/vec-strcmp.S
@@ -0,0 +1,32 @@
+ .text
+ .balign 4
+ .global vec_strcmp
+ # int vec_strcmp(const char *src1, const char* src2)
+vec_strcmp:
+ ## Using LMUL=2, but same register names work for larger LMULs
+ li t1, 0 # Initial pointer bump
+loop:
+ vsetvli t0, x0, e8, m2, ta, ma # Max length vectors of bytes
+ add a0, a0, t1 # Bump src1 pointer
+ vle8ff.v v8, (a0) # Get src1 bytes
+ add a1, a1, t1 # Bump src2 pointer
+ vle8ff.v v16, (a1) # Get src2 bytes
+
+ vmseq.vi v0, v8, 0 # Flag zero bytes in src1
+ vmsne.vv v1, v8, v16 # Flag if src1 != src2
+ vmor.mm v0, v0, v1 # Combine exit conditions
+
+ vfirst.m a2, v0 # ==0 or != ?
+ csrr t1, vl # Get number of bytes fetched
+
+ bltz a2, loop # Loop if all same and no zero byte
+
+ add a0, a0, a2 # Get src1 element address
+ lbu a3, (a0) # Get src1 byte from memory
+
+ add a1, a1, a2 # Get src2 element address
+ lbu a4, (a1) # Get src2 byte from memory
+
+ sub a0, a3, a4 # Return value.
+
+ ret