// Copyright 2018 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. #include "go_asm.h" #include "textflag.h" TEXT ·IndexByte(SB),NOSPLIT|NOFRAME,$0-40 MOVD b_base+0(FP), R3// b_base => R3 MOVD b_len+8(FP), R4 // b_len => R4 MOVBZ c+24(FP), R5 // c => R5 MOVD $ret+32(FP), R2 // &ret => R9 BR indexbytebody<>(SB) TEXT ·IndexByteString(SB),NOSPLIT|NOFRAME,$0-32 MOVD s_base+0(FP), R3// s_base => R3 MOVD s_len+8(FP), R4 // s_len => R4 MOVBZ c+16(FP), R5 // c => R5 MOVD $ret+24(FP), R2 // &ret => R9 BR indexbytebody<>(SB) // input: // R3: s // R4: s_len // R5: c -- byte sought // R2: &ret -- address to put index into TEXT indexbytebody<>(SB),NOSPLIT|NOFRAME,$0 CMPBEQ R4, $0, notfound MOVD R3, R6 // store base for later ADD R3, R4, R8 // the address after the end of the string //if the length is small, use loop; otherwise, use vector or srst search CMPBGE R4, $16, large residual: CMPBEQ R3, R8, notfound MOVBZ 0(R3), R7 LA 1(R3), R3 CMPBNE R7, R5, residual found: SUB R6, R3 SUB $1, R3 MOVD R3, 0(R2) RET notfound: MOVD $-1, 0(R2) RET large: MOVBZ internal∕cpu·S390X+const_offsetS390xHasVX(SB), R1 CMPBNE R1, $0, vectorimpl srstimpl: // no vector facility MOVBZ R5, R0 // c needs to be in R0, leave until last minute as currently R0 is expected to be 0 srstloop: WORD $0xB25E0083 // srst %r8, %r3 (search the range [R3, R8)) BVS srstloop // interrupted - continue BGT notfoundr0 foundr0: XOR R0, R0 // reset R0 SUB R6, R8 // remove base MOVD R8, 0(R2) RET notfoundr0: XOR R0, R0 // reset R0 MOVD $-1, 0(R2) RET vectorimpl: //if the address is not 16byte aligned, use loop for the header MOVD R3, R8 AND $15, R8 CMPBGT R8, $0, notaligned aligned: ADD R6, R4, R8 MOVD R8, R7 AND $-16, R7 // replicate c across V17 VLVGB $0, R5, V19 VREPB $0, V19, V17 vectorloop: CMPBGE R3, R7, residual VL 0(R3), V16 // load string to be searched into V16 ADD $16, R3 VFEEBS V16, V17, V18 // search V17 in V16 and set conditional code accordingly BVS vectorloop // when vector search found c in the string VLGVB $7, V18, R7 // load 7th element of V18 containing index into R7 SUB $16, R3 SUB R6, R3 ADD R3, R7 MOVD R7, 0(R2) RET notaligned: MOVD R3, R8 AND $-16, R8 ADD $16, R8 notalignedloop: CMPBEQ R3, R8, aligned MOVBZ 0(R3), R7 LA 1(R3), R3 CMPBNE R7, R5, notalignedloop BR found