123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314 |
/* Literal-pool entries holding the MASK0..MASK4 constants (the MASK*
   macros themselves are defined outside this view).  The .Lmask*
   labels are the operands of the l32r loads in the word-comparison
   code.  */
- .literal .Lmask0, MASK0
- .literal .Lmask1, MASK1
- .literal .Lmask2, MASK2
- .literal .Lmask3, MASK3
- .literal .Lmask4, MASK4
- .text
/* strcmp entry.  a2 and a3 are used as the two string pointers
   (presumably s1 and s2 per the calling convention -- confirm); the
   result is returned in a2.  This prologue compares the first byte and
   then picks a path from the low two address bits of the pointers:
     - both word-aligned            -> .Laligned
     - different low address bits   -> .Lunaligned (byte loop)
     - same non-zero low bits       -> compare up to three bytes here
                                       until a2 is word-aligned, then
                                       continue at .Laligned.  */
- ENTRY (strcmp)
-
- l8ui a8, a2, 0 /* a8 = first byte of the string at a2 */
- l8ui a9, a3, 0 /* a9 = first byte of the string at a3 */
- movi a10, 3 /* a10 = mask of the low two address bits */
- bne a8, a9, .Lretdiff /* first bytes differ: return a8 - a9 */
- or a11, a2, a3
- bnone a11, a10, .Laligned /* neither pointer has a low bit set: both word-aligned */
- xor a11, a2, a3
- bany a11, a10, .Lunaligned /* low bits differ between the pointers: byte-by-byte path */
-
- addi a2, a2, 1 /* step 1 reuses the bytes loaded above (already known equal) */
- beqz a8, .Leq /* the equal byte was NUL: strings are equal */
- addi a3, a3, 1
- bnone a2, a10, .Laligned /* a2 is now word-aligned (a3 shares its low bits) */
- l8ui a8, a2, 0 /* step 2: load and compare the next byte pair */
- l8ui a9, a3, 0
- addi a2, a2, 1
- bne a8, a9, .Lretdiff
- beqz a8, .Leq
- addi a3, a3, 1
- bnone a2, a10, .Laligned
- l8ui a8, a2, 0 /* step 3: last possible misaligned byte pair */
- l8ui a9, a3, 0
- addi a2, a2, 1
- bne a8, a9, .Lretdiff
- beqz a8, .Leq
- addi a3, a3, 1
- j .Laligned /* three single-byte steps always reach word alignment */
- .align 4
-
/* Byte-at-a-time comparison, entered when the two pointers differ in
   their low two address bits.  Control ends up at .Lretdiff, which
   returns the difference of the last pair of bytes loaded.
   NOTE(review): this view contains both a hardware-loop setup with a
   beqz exit and a bnez branch back to .Lnextbyte.  These look like two
   alternative forms of the same loop whose selecting conditionals are
   not visible here -- confirm against the full file.  */
- .Lunaligned:
- _movi.n a8, 0 /* loop-count register = 0; presumably yields the maximum trip count -- confirm against the LOOP definition */
- loop a8, .Lretdiff /* hardware loop whose body ends at .Lretdiff */
- .Lnextbyte:
- l8ui a8, a2, 0 /* next byte from each string */
- l8ui a9, a3, 0
- addi a2, a2, 1
- bne a8, a9, .Lretdiff /* bytes differ: done */
- addi a3, a3, 1
- beqz a8, .Lretdiff /* equal and NUL: done (a8 - a9 is 0) */
- bnez a8, .Lnextbyte /* equal and non-NUL: next byte pair */
- .Lretdiff:
- sub a2, a8, a9 /* result = difference of the two bytes (both zero-extended by l8ui) */
- retw
- .align 4
/* Word-at-a-time comparison for word-aligned pointers, written as a
   hardware loop unrolled to two words per iteration.  a4 = MASK0 and
   a7 = MASK4 are loaded from the literal pool.  Each word pair is
   first tested for equality; then (w | (w << 1)) is tested against
   MASK4, and if not every MASK4 bit is set the code leaves the loop
   for the exact per-mask check at .Lprobeq.  Presumably this is a
   cheap filter for words that might contain a NUL byte -- confirm
   against the MASK4 definition, which is outside this view.
   NOTE(review): .Laligned is defined a second time right after this
   block; the two look like alternative variants whose selecting
   conditionals are not visible here.  */
- .Laligned:
- .begin no-transform
- l32r a4, .Lmask0 /* a4 = MASK0 */
- l32r a7, .Lmask4 /* a7 = MASK4 */
-
- loop a4, .Laligned_done /* a4 (MASK0) doubles as the loop count */
-
- l32i a8, a2, 0 /* first word of the pair */
- l32i a9, a3, 0
- slli a5, a8, 1 /* a5 = word << 1; also read at .Lwne2 */
- bne a8, a9, .Lwne2 /* words differ */
- or a9, a8, a5 /* a9 reused as scratch: word | (word << 1) */
- bnall a9, a7, .Lprobeq /* some MASK4 bit clear: check the word exactly */
-
- l32i a8, a2, 4 /* second word of the pair */
- l32i a9, a3, 4
- slli a5, a8, 1
- bne a8, a9, .Lwne2
- or a9, a8, a5
- bnall a9, a7, .Lprobeq2 /* as above, but the pointers still need +4 first */
- addi a2, a2, 8 /* both words passed: advance by two words */
- addi a3, a3, 8
- .Laligned_done:
- or a1, a1, a1 /* leaves a1 unchanged (acts as a no-op) */
- .Lprobeq2:
-
- addi a2, a2, 4 /* skip the first word of the unrolled pair */
- addi a3, a3, 4
/* Second definition of .Laligned in this view: the same filtered
   word-at-a-time scan written with ordinary branches instead of a
   hardware loop, with the masks materialized by movi rather than
   l32r.
   NOTE(review): presumably an alternative to the loop-based variant
   that precedes it, selected by a conditional not visible here --
   confirm.  */
- .Laligned:
- movi a4, MASK0
- movi a7, MASK4
- j .Lfirstword /* first word: no pointer advance yet */
- .Lnextword:
- addi a2, a2, 4
- addi a3, a3, 4
- .Lfirstword:
- l32i a8, a2, 0
- l32i a9, a3, 0
- slli a5, a8, 1 /* a5 = word << 1; also read at .Lwne2 */
- bne a8, a9, .Lwne2 /* words differ */
- or a9, a8, a5 /* a9 reused as scratch: word | (word << 1) */
- ball a9, a7, .Lnextword /* every MASK4 bit set: keep scanning; otherwise fall through to .Lprobeq */
-
/* Exact check, reached when the two words just loaded compared equal
   (a8 still holds the word) but the MASK4 filter did not pass.  If a8
   has no bits set under any one of MASK0..MASK3, the strings are
   equal (presumably each mask selects one byte lane, so this detects
   a NUL byte -- the mask values are outside this view).  Otherwise
   the rest of the strings is compared one word at a time, applying
   the same four per-mask tests to every word.
   NOTE(review): the word loop appears twice below, once as a hardware
   loop and once with explicit branches (.Lfirstword2/.Lnextword2);
   presumably alternative variants whose selecting conditionals are
   not visible here -- confirm.  */
- .Lprobeq:
-
- bnone a8, a4, .Leq /* no bits under MASK0 */
- l32r a5, .Lmask1 /* a5 = MASK1 */
- l32r a6, .Lmask2 /* a6 = MASK2 */
- bnone a8, a5, .Leq
- l32r a7, .Lmask3 /* a7 = MASK3, replacing MASK4 */
- bnone a8, a6, .Leq
- bnone a8, a7, .Leq
- addi.n a2, a2, 4 /* word fully checked: advance both pointers */
- addi.n a3, a3, 4
-
- loop a4, .Leq /* hardware loop ending at .Leq; a4 (MASK0) is the count */
- .end no-transform
- l32i a8, a2, 0
- l32i a9, a3, 0
- addi a2, a2, 4
- bne a8, a9, .Lwne /* words differ: locate the deciding byte */
- bnone a8, a4, .Leq
- bnone a8, a5, .Leq
- bnone a8, a6, .Leq
- bnone a8, a7, .Leq
- addi a3, a3, 4
- j .Lfirstword2
- .Lnextword2:
- addi a3, a3, 4
- .Lfirstword2:
- l32i a8, a2, 0
- l32i a9, a3, 0
- addi a2, a2, 4
- bne a8, a9, .Lwne /* words differ: locate the deciding byte */
- bnone a8, a4, .Leq
- bnone a8, a5, .Leq
- bnone a8, a6, .Leq
- bany a8, a7, .Lnextword2 /* bits present under MASK3 as well: next word; otherwise fall through to .Leq */
-
/* .Leq: return 0.
   .Lwne2: reached from the MASK4-filtered word scan when the words in
   a8 and a9 differ (at that point a5 = a8 << 1 and a7 = MASK4).  If
   the MASK4 filter passes for a8, the result is decided by a single
   unsigned comparison of the whole words and is -1 or 1; otherwise
   control goes to .Lsomezero for the per-byte search.
   NOTE(review): ordering whole words by unsigned compare matches
   byte-wise string order for only one byte order -- presumably this
   path is conditional on endianness in the full file; confirm.  */
- .Leq: movi a2, 0
- retw
- .Lwne2:
- or a10, a8, a5 /* a8 | (a8 << 1) */
- bnall a10, a7, .Lsomezero /* filter did not pass: search byte by byte */
- bgeu a8, a9, .Lposreturn /* unsigned a8 >= a9 (the words are known to differ) */
- movi a2, -1
- retw
- .Lposreturn:
- movi a2, 1
- retw
/* Words in a8 and a9 differ: find which comes first, a differing byte
   or a part of a8 with no bits set under its mask.  a2 = a8 ^ a9
   marks the differing bits.  For MASK0, MASK1 and MASK2 in turn: a
   difference under the mask goes to the matching .LdiffN handler;
   otherwise, if a8 has no bits under that mask, the strings are
   equal.  If all three pass, control falls through to the labels that
   follow.  a4 holds MASK0 on every path that reaches here in this
   view.
   NOTE(review): .Ldiff0 .. .Ldiff3 are each defined twice below.  The
   first set subtracts whole words (with a byte extract only for
   .Ldiff0); the second set extracts one byte per handler at bit
   offsets 0, 8, 16 and 24.  Presumably these are the two byte-order
   variants, selected by a conditional not visible here -- confirm.  */
- .Lsomezero:
- .Lwne:
- xor a2, a8, a9 /* a2 = bits where the two words differ */
- bany a2, a4, .Ldiff0 /* difference under MASK0 */
- movi a5, MASK1
- bnone a8, a4, .Leq /* MASK0 part equal and zero: strings are equal */
- bany a2, a5, .Ldiff1 /* difference under MASK1 */
- movi a6, MASK2
- bnone a8, a5, .Leq
- bany a2, a6, .Ldiff2 /* difference under MASK2 */
- bnone a8, a6, .Leq
- .Ldiff3:
- .Ldiff2:
- .Ldiff1:
-
- sub a2, a8, a9 /* result = whole-word difference */
- retw
- .Ldiff0:
-
- extui a10, a8, 24, 8 /* bits 31..24 of each word */
- extui a11, a9, 24, 8
- sub a2, a10, a11 /* result = difference of the extracted bytes */
- retw
-
- .Ldiff3:
-
- extui a10, a8, 24, 8 /* bits 31..24 of each word */
- extui a11, a9, 24, 8
- sub a2, a10, a11
- retw
- .Ldiff0:
-
- extui a10, a8, 0, 8 /* bits 7..0 of each word */
- extui a11, a9, 0, 8
- sub a2, a10, a11
- retw
- .Ldiff1:
-
- extui a10, a8, 8, 8 /* bits 15..8 of each word */
- extui a11, a9, 8, 8
- sub a2, a10, a11
- retw
- .Ldiff2:
-
- extui a10, a8, 16, 8 /* bits 23..16 of each word */
- extui a11, a9, 16, 8
- sub a2, a10, a11
- retw
/* Symbol bookkeeping through macros defined outside this view.  Going
   by the macro names, strcoll is made an alias of strcmp and both get
   hidden definitions -- confirm against the macro definitions.  */
- libc_hidden_def (strcmp)
- strong_alias (strcmp, strcoll)
- libc_hidden_def (strcoll)
|