Skip to content

Instantly share code, notes, and snippets.

@Mistuke
Created January 23, 2024 12:59
Show Gist options
  • Save Mistuke/d9252bfcb2aa766327c5f377e162f5b7 to your computer and use it in GitHub Desktop.
Save Mistuke/d9252bfcb2aa766327c5f377e162f5b7 to your computer and use it in GitHub Desktop.
// ---------------------------------------------------------------------
// .L4 -- AArch64 SVE loop body (GNU as syntax; `//` starts a comment).
//
// Per iteration, for every lane (p6 governs the loads and stores,
// p7 the merging multiplies):
//   e = 2 * (w1 + z31[lane])      even halfword index   (z22)
//   o = e + 1                     odd halfword index    (z19)
//   x2[e] = ( sum_k  Ak * xk[e] - Bk * xk[o] ) >> 15
//   x2[o] = ( sum_k  Bk * xk[e] + Ak * xk[o] ) >> 15
// where xk ranges over the halfword arrays at x6, x5, x4, x3 and
// (Ak, Bk) = (z30, z29), (z28, z27), (z26, z25), (z24, z23).
// Inputs are sign-extended 16 -> 32 bits, arithmetic is done in 32-bit
// lanes, the shift is arithmetic, and only the low 16 bits of each
// lane are stored.
//
// Read but never written here: x2-x6, w8, z23-z31, p6, p7.
// Written here: w1, z0-z2, z4-z7, z16-z22, condition flags.
//
// NOTE(review): this has the shape of a Q15 complex multiply-accumulate
//   over interleaved re/im samples -- confirm against the original
//   source, which is not visible here.
// NOTE(review): z31 presumably holds per-lane offsets (0, 1, 2, ...)
//   and z23-z30 broadcast coefficients; both are set up outside this
//   view -- confirm.
// NOTE(review): the exit test is an exact equality after stepping w1
//   by 12, so it assumes w8 is reachable in steps of 12 -- confirm the
//   setup code guarantees that.
// ---------------------------------------------------------------------
.L4:
        // ---- element indices ------------------------------------------
        dup     z22.s, w1                       // broadcast loop counter
        add     z22.s, z22.s, z31.s             // + per-lane offset
        lsl     z22.s, z22.s, #1                // z22 = even index e
        movprfx z19, z22
        add     z19.s, z19.s, #1                // z19 = odd index o = e + 1

        // ---- gather inputs: base + zero-extended index * 2 bytes ------
        // All loads are issued before either store below.
        ld1sh   z21.s, p6/z, [x6, z22.s, uxtw #1]       // x6[e]
        ld1sh   z2.s, p6/z, [x6, z19.s, uxtw #1]        // x6[o]
        ld1sh   z17.s, p6/z, [x5, z22.s, uxtw #1]       // x5[e]
        ld1sh   z1.s, p6/z, [x5, z19.s, uxtw #1]        // x5[o]
        ld1sh   z6.s, p6/z, [x4, z22.s, uxtw #1]        // x4[e]
        ld1sh   z0.s, p6/z, [x4, z19.s, uxtw #1]        // x4[o]
        ld1sh   z18.s, p6/z, [x3, z22.s, uxtw #1]       // x3[e]
        ld1sh   z4.s, p6/z, [x3, z19.s, uxtw #1]        // x3[o]

        // ---- even output: sum of (Ak * xk[e] - Bk * xk[o]) ------------
        // Each movprfx must stay immediately ahead of the mul it prefixes.
        movprfx z20, z30
        mul     z20.s, p7/m, z20.s, z21.s       // z20  = z30 * x6[e]
        mls     z20.s, p7/m, z29.s, z2.s        // z20 -= z29 * x6[o]
        movprfx z16, z28
        mul     z16.s, p7/m, z16.s, z17.s       // z16  = z28 * x5[e]
        mls     z16.s, p7/m, z27.s, z1.s        // z16 -= z27 * x5[o]
        movprfx z5, z26
        mul     z5.s, p7/m, z5.s, z6.s          // z5   = z26 * x4[e]
        mls     z5.s, p7/m, z25.s, z0.s         // z5  -= z25 * x4[o]
        movprfx z7, z24
        mul     z7.s, p7/m, z7.s, z18.s         // z7   = z24 * x3[e]
        mls     z7.s, p7/m, z23.s, z4.s         // z7  -= z23 * x3[o]
        add     z16.s, z16.s, z20.s             // accumulate the four terms
        add     z16.s, z16.s, z5.s
        add     z16.s, z16.s, z7.s
        asr     z16.s, z16.s, #15               // arithmetic >> 15
        st1h    z16.s, p6, [x2, z22.s, uxtw #1] // x2[e] = low halfword

        // ---- odd output: sum of (Bk * xk[e] + Ak * xk[o]) -------------
        // The even-index inputs are consumed in place from here on.
        mul     z21.s, p7/m, z21.s, z29.s       // z21  = x6[e] * z29
        mla     z21.s, p7/m, z2.s, z30.s        // z21 += x6[o] * z30
        mul     z17.s, p7/m, z17.s, z27.s       // z17  = x5[e] * z27
        mla     z17.s, p7/m, z1.s, z28.s        // z17 += x5[o] * z28
        mul     z6.s, p7/m, z6.s, z25.s         // z6   = x4[e] * z25
        mla     z6.s, p7/m, z0.s, z26.s         // z6  += x4[o] * z26
        mul     z18.s, p7/m, z18.s, z23.s       // z18  = x3[e] * z23
        mla     z18.s, p7/m, z4.s, z24.s        // z18 += x3[o] * z24
        add     z17.s, z17.s, z21.s             // accumulate the four terms
        add     z17.s, z17.s, z6.s
        add     z17.s, z17.s, z18.s
        asr     z17.s, z17.s, #15               // arithmetic >> 15
        st1h    z17.s, p6, [x2, z19.s, uxtw #1] // x2[o] = low halfword

        // ---- loop control ---------------------------------------------
        add     w1, w1, #12                     // advance counter by 12
        cmp     w8, w1
        b.ne    .L4                             // repeat until w1 == w8
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment