unified callee save register handling

This commit is contained in:
JanLJL
2022-01-31 12:04:28 -05:00
parent 97bfe42eac
commit ca87e93fd6
178 changed files with 5530 additions and 3581 deletions

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -86,16 +94,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -87,16 +95,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -43,16 +51,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -87,16 +95,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -87,16 +95,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -234,16 +242,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -234,16 +242,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -44,16 +52,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -64,16 +72,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -64,16 +72,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -43,16 +51,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -44,16 +52,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -44,16 +52,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -187,16 +195,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -57,16 +65,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -63,16 +71,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -57,16 +65,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -57,16 +65,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -67,16 +75,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -67,16 +75,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -74,16 +82,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -78,16 +86,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -95,16 +103,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -123,16 +131,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -65,16 +73,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -65,16 +73,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -50,16 +58,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -51,16 +59,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -50,16 +58,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -74,16 +82,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -68,16 +76,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -74,16 +82,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -75,16 +83,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -73,16 +81,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -75,16 +83,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -73,16 +81,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
sub sp, sp, #64
st1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -42,16 +50,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.4s, v13.4s, v14.4s, v15.4s}, [sp]
add sp, sp, #64
ld1 {v8.4s, v9.4s, v10.4s, v11.4s}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -47,16 +55,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -59,16 +67,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -47,16 +55,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -51,16 +59,19 @@ loop:
done:
mov sp, x24
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -56,16 +64,19 @@ loop:
done:
mov sp, x24
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -45,16 +53,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -56,16 +64,19 @@ loop:
done:
mov sp, x24
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -55,16 +63,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -63,16 +71,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
mov x24, sp
@@ -56,16 +64,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -104,16 +112,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -49,16 +57,19 @@ loop:
done:
mov sp, x24
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -62,16 +70,19 @@ loop:
bne loop
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -44,16 +52,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
mov x24, sp
@@ -54,16 +62,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
mov x24, sp
@@ -56,16 +64,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -51,16 +59,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -41,16 +49,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

View File

@@ -13,16 +13,24 @@ ninst:
latency:
# push callee-save registers onto stack
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
stp x29, x30, [sp, -96]!
stp x19, x20, [sp, 16]
stp x21, x22, [sp, 32]
stp x24, x25, [sp, 48]
stp x26, x27, [sp, 64]
str x28, [sp, 80]
sub sp, sp, #64
st1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
sub sp, sp, #64
st1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
sub sp, sp, #64
st1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp]
sub sp, sp, #64
st1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp]
sub sp, sp, #64
st1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp]
sub sp, sp, #64
st1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp]
stp x19, x20, [sp, -96]!
stp x21, x22, [sp, 16]
stp x23, x24, [sp, 32]
stp x25, x26, [sp, 48]
stp x27, x28, [sp, 64]
stp x29, x30, [sp, 80]
mov x4, N
@@ -40,16 +48,19 @@ loop:
done:
# pop callee-save registers from stack
ldp x19, x20, [sp, 16]
ldp x21, x22, [sp, 32]
ldp x24, x25, [sp, 48]
ldp x26, x27, [sp, 64]
ldr x28, [sp, 80]
ldp x29, x30, [sp], 96
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp]
add sp, sp, #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp]
add sp, sp, #64
ldp x19, x20, [sp]
ldp x21, x22, [sp, 16]
ldp x23, x24, [sp, 32]
ldp x25, x26, [sp, 48]
ldp x27, x28, [sp, 64]
ldp x29, x30, [sp, 80]
add sp, sp, #96
ld1 {v28.2d, v29.2d, v30.2d, v31.2d}, [sp], #64
ld1 {v24.2d, v25.2d, v26.2d, v27.2d}, [sp], #64
ld1 {v20.2d, v21.2d, v22.2d, v23.2d}, [sp], #64
ld1 {v16.2d, v17.2d, v18.2d, v19.2d}, [sp], #64
ld1 {v12.2d, v13.2d, v14.2d, v15.2d}, [sp], #64
ld1 {v8.2d, v9.2d, v10.2d, v11.2d}, [sp], #64
ret

Some files were not shown because too many files have changed in this diff Show More