1
2
3
4
5
6
7
8
9
10
11
12
13
14
15 #include <asm/export.h>
16 .set noreorder
17 .set noat
18
19 .align 3
20
21 .globl strlen
22 .ent strlen
23
24 strlen:
25 ldq_u $1, 0($16) # load first quadword ($16 may be misaligned)
26 lda $2, -1($31)
27 insqh $2, $16, $2
28 andnot $16, 7, $0
29 or $2, $1, $1
30 cmpbge $31, $1, $2 # $2 <- bitmask: bit i == 1 <==> i-th byte == 0
31 bne $2, found
32
33 loop: ldq $1, 8($0)
34 addq $0, 8, $0 # addr += 8
35 nop # helps dual issue last two insns
36 cmpbge $31, $1, $2
37 beq $2, loop
38
39 found: blbs $2, done # make aligned case fast
40 negq $2, $3
41 and $2, $3, $2
42
43 and $2, 0x0f, $1
44 addq $0, 4, $3
45 cmoveq $1, $3, $0
46
47 and $2, 0x33, $1
48 addq $0, 2, $3
49 cmoveq $1, $3, $0
50
51 and $2, 0x55, $1
52 addq $0, 1, $3
53 cmoveq $1, $3, $0
54
55 done: subq $0, $16, $0
56 ret $31, ($26)
57
58 .end strlen
59 EXPORT_SYMBOL(strlen)