| .. | .. |
|---|
| 24 | 24 | |
|---|
| 25 | 25 | .text |
|---|
| 26 | 26 | |
|---|
| 27 | | -ENTRY(chacha_2block_xor_avx512vl) |
|---|
| 27 | +SYM_FUNC_START(chacha_2block_xor_avx512vl) |
|---|
| 28 | 28 | # %rdi: Input state matrix, s |
|---|
| 29 | 29 | # %rsi: up to 2 data blocks output, o |
|---|
| 30 | 30 | # %rdx: up to 2 data blocks input, i |
|---|
| .. | .. |
|---|
| 166 | 166 | |
|---|
| 167 | 167 | .Ldone2: |
|---|
| 168 | 168 | vzeroupper |
|---|
| 169 | | - ret |
|---|
| 169 | + RET |
|---|
| 170 | 170 | |
|---|
| 171 | 171 | .Lxorpart2: |
|---|
| 172 | 172 | # xor remaining bytes from partial register into output |
|---|
| 173 | 173 | mov %rcx,%rax |
|---|
| 174 | 174 | and $0xf,%rcx |
|---|
| 175 | | - jz .Ldone8 |
|---|
| 175 | + jz .Ldone2 |
|---|
| 176 | 176 | mov %rax,%r9 |
|---|
| 177 | 177 | and $~0xf,%r9 |
|---|
| 178 | 178 | |
|---|
| .. | .. |
|---|
| 187 | 187 | |
|---|
| 188 | 188 | jmp .Ldone2 |
|---|
| 189 | 189 | |
|---|
| 190 | | -ENDPROC(chacha_2block_xor_avx512vl) |
|---|
| 190 | +SYM_FUNC_END(chacha_2block_xor_avx512vl) |
|---|
| 191 | 191 | |
|---|
| 192 | | -ENTRY(chacha_4block_xor_avx512vl) |
|---|
| 192 | +SYM_FUNC_START(chacha_4block_xor_avx512vl) |
|---|
| 193 | 193 | # %rdi: Input state matrix, s |
|---|
| 194 | 194 | # %rsi: up to 4 data blocks output, o |
|---|
| 195 | 195 | # %rdx: up to 4 data blocks input, i |
|---|
| .. | .. |
|---|
| 432 | 432 | |
|---|
| 433 | 433 | .Ldone4: |
|---|
| 434 | 434 | vzeroupper |
|---|
| 435 | | - ret |
|---|
| 435 | + RET |
|---|
| 436 | 436 | |
|---|
| 437 | 437 | .Lxorpart4: |
|---|
| 438 | 438 | # xor remaining bytes from partial register into output |
|---|
| 439 | 439 | mov %rcx,%rax |
|---|
| 440 | 440 | and $0xf,%rcx |
|---|
| 441 | | - jz .Ldone8 |
|---|
| 441 | + jz .Ldone4 |
|---|
| 442 | 442 | mov %rax,%r9 |
|---|
| 443 | 443 | and $~0xf,%r9 |
|---|
| 444 | 444 | |
|---|
| .. | .. |
|---|
| 453 | 453 | |
|---|
| 454 | 454 | jmp .Ldone4 |
|---|
| 455 | 455 | |
|---|
| 456 | | -ENDPROC(chacha_4block_xor_avx512vl) |
|---|
| 456 | +SYM_FUNC_END(chacha_4block_xor_avx512vl) |
|---|
| 457 | 457 | |
|---|
| 458 | | -ENTRY(chacha_8block_xor_avx512vl) |
|---|
| 458 | +SYM_FUNC_START(chacha_8block_xor_avx512vl) |
|---|
| 459 | 459 | # %rdi: Input state matrix, s |
|---|
| 460 | 460 | # %rsi: up to 8 data blocks output, o |
|---|
| 461 | 461 | # %rdx: up to 8 data blocks input, i |
|---|
| .. | .. |
|---|
| 812 | 812 | |
|---|
| 813 | 813 | .Ldone8: |
|---|
| 814 | 814 | vzeroupper |
|---|
| 815 | | - ret |
|---|
| 815 | + RET |
|---|
| 816 | 816 | |
|---|
| 817 | 817 | .Lxorpart8: |
|---|
| 818 | 818 | # xor remaining bytes from partial register into output |
|---|
| .. | .. |
|---|
| 833 | 833 | |
|---|
| 834 | 834 | jmp .Ldone8 |
|---|
| 835 | 835 | |
|---|
| 836 | | -ENDPROC(chacha_8block_xor_avx512vl) |
|---|
| 836 | +SYM_FUNC_END(chacha_8block_xor_avx512vl) |
|---|