diff options
author | danlark <danlark@yandex-team.ru> | 2022-02-10 16:46:10 +0300 |
---|---|---|
committer | Daniil Cherednik <dcherednik@yandex-team.ru> | 2022-02-10 16:46:10 +0300 |
commit | baa58daefa91fde4b4769facdbd2903763b9c6a8 (patch) | |
tree | 1a2c5ffcf89eb53ecd79dbc9bc0a195c27404d0c /contrib/libs/openssl/asm/ppc64le/crypto/poly1305 | |
parent | 3426a9bc7f169ae9da54cef557ad2a33f6e8eee0 (diff) | |
download | ydb-baa58daefa91fde4b4769facdbd2903763b9c6a8.tar.gz |
Restoring authorship annotation for <danlark@yandex-team.ru>. Commit 2 of 2.
Diffstat (limited to 'contrib/libs/openssl/asm/ppc64le/crypto/poly1305')
-rw-r--r-- | contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppc.s | 284 | ||||
-rw-r--r-- | contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppcfp.s | 1032 |
2 files changed, 658 insertions, 658 deletions
diff --git a/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppc.s b/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppc.s index e2d8edb2d1..3fbf9185d1 100644 --- a/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppc.s +++ b/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppc.s @@ -1,21 +1,21 @@ -.machine "any" -.text -.globl poly1305_init_int -.type poly1305_init_int,@function +.machine "any" +.text +.globl poly1305_init_int +.type poly1305_init_int,@function .section ".opd","aw" .align 3 poly1305_init_int: .quad .poly1305_init_int,.TOC.@tocbase,0 .previous -.align 4 +.align 4 .poly1305_init_int: - xor 0,0,0 - std 0,0(3) - std 0,8(3) - std 0,16(3) - - cmpld 4,0 - beq- .Lno_key + xor 0,0,0 + std 0,0(3) + std 0,8(3) + std 0,16(3) + + cmpld 4,0 + beq- .Lno_key li 7,4 lwbrx 10,0,4 li 11,8 @@ -25,61 +25,61 @@ poly1305_init_int: lwbrx 8,8,4 insrdi 10,7,32,0 insrdi 11,8,32,0 - lis 8,0xfff - ori 8,8,0xfffc - insrdi 8,8,32,0 - ori 7,8,3 - - and 10,10,7 - and 11,11,8 - - std 10,32(3) - std 11,40(3) - -.Lno_key: - xor 3,3,3 - blr -.long 0 -.byte 0,12,0x14,0,0,0,2,0 + lis 8,0xfff + ori 8,8,0xfffc + insrdi 8,8,32,0 + ori 7,8,3 + + and 10,10,7 + and 11,11,8 + + std 10,32(3) + std 11,40(3) + +.Lno_key: + xor 3,3,3 + blr +.long 0 +.byte 0,12,0x14,0,0,0,2,0 .size .poly1305_init_int,.-.poly1305_init_int .size poly1305_init_int,.-.poly1305_init_int - -.globl poly1305_blocks -.type poly1305_blocks,@function + +.globl poly1305_blocks +.type poly1305_blocks,@function .section ".opd","aw" .align 3 poly1305_blocks: .quad .poly1305_blocks,.TOC.@tocbase,0 .previous -.align 4 +.align 4 .poly1305_blocks: - srdi. 5,5,4 - beq- .Labort - - stdu 1,-192(1) - mflr 0 - std 27,152(1) - std 28,160(1) - std 29,168(1) - std 30,176(1) - std 31,184(1) - std 0,208(1) - - ld 27,32(3) - ld 28,40(3) - - ld 7,0(3) - ld 8,8(3) - ld 9,16(3) - - srdi 29,28,2 - mtctr 5 - add 29,29,28 - li 0,3 - b .Loop - -.align 4 -.Loop: + srdi. 5,5,4 + beq- .Labort + + stdu 1,-192(1) + mflr 0 + std 27,152(1) + std 28,160(1) + std 29,168(1) + std 30,176(1) + std 31,184(1) + std 0,208(1) + + ld 27,32(3) + ld 28,40(3) + + ld 7,0(3) + ld 8,8(3) + ld 9,16(3) + + srdi 29,28,2 + mtctr 5 + add 29,29,28 + li 0,3 + b .Loop + +.align 4 +.Loop: li 10,4 lwbrx 30,0,4 li 31,8 @@ -89,94 +89,94 @@ poly1305_blocks: lwbrx 11,11,4 insrdi 30,10,32,0 insrdi 31,11,32,0 - addi 4,4,16 - - addc 7,7,30 - adde 8,8,31 - - mulld 10,7,27 - mulhdu 11,7,27 - adde 9,9,6 - - mulld 30,8,29 - mulhdu 31,8,29 - addc 10,10,30 - adde 11,11,31 - - mulld 30,7,28 - mulhdu 12,7,28 - addc 11,11,30 - addze 12,12 - - mulld 30,8,27 - mulhdu 31,8,27 - addc 11,11,30 - adde 12,12,31 - - mulld 30,9,29 - mulld 31,9,27 - addc 11,11,30 - adde 12,12,31 - - andc 30,12,0 - and 9,12,0 - srdi 31,30,2 - add 30,30,31 - addc 7,10,30 - addze 8,11 - addze 9,9 - - bdnz .Loop - - std 7,0(3) - std 8,8(3) - std 9,16(3) - - ld 27,152(1) - ld 28,160(1) - ld 29,168(1) - ld 30,176(1) - ld 31,184(1) - addi 1,1,192 -.Labort: - blr -.long 0 -.byte 0,12,4,1,0x80,5,4,0 + addi 4,4,16 + + addc 7,7,30 + adde 8,8,31 + + mulld 10,7,27 + mulhdu 11,7,27 + adde 9,9,6 + + mulld 30,8,29 + mulhdu 31,8,29 + addc 10,10,30 + adde 11,11,31 + + mulld 30,7,28 + mulhdu 12,7,28 + addc 11,11,30 + addze 12,12 + + mulld 30,8,27 + mulhdu 31,8,27 + addc 11,11,30 + adde 12,12,31 + + mulld 30,9,29 + mulld 31,9,27 + addc 11,11,30 + adde 12,12,31 + + andc 30,12,0 + and 9,12,0 + srdi 31,30,2 + add 30,30,31 + addc 7,10,30 + addze 8,11 + addze 9,9 + + bdnz .Loop + + std 7,0(3) + std 8,8(3) + std 9,16(3) + + ld 27,152(1) + ld 28,160(1) + ld 29,168(1) + ld 30,176(1) + ld 31,184(1) + addi 1,1,192 +.Labort: + blr +.long 0 +.byte 0,12,4,1,0x80,5,4,0 .size .poly1305_blocks,.-.poly1305_blocks .size poly1305_blocks,.-.poly1305_blocks - -.globl poly1305_emit -.type poly1305_emit,@function + +.globl poly1305_emit +.type poly1305_emit,@function .section ".opd","aw" .align 3 poly1305_emit: .quad .poly1305_emit,.TOC.@tocbase,0 .previous -.align 4 +.align 4 .poly1305_emit: - ld 7,0(3) - ld 8,8(3) - ld 9,16(3) - ld 6,0(5) - ld 5,8(5) - - addic 10,7,5 - addze 11,8 - addze 12,9 - - srdi 0,12,2 - neg 0,0 - - andc 7,7,0 - and 10,10,0 - andc 8,8,0 - and 11,11,0 - or 7,7,10 - or 8,8,11 + ld 7,0(3) + ld 8,8(3) + ld 9,16(3) + ld 6,0(5) + ld 5,8(5) + + addic 10,7,5 + addze 11,8 + addze 12,9 + + srdi 0,12,2 + neg 0,0 + + andc 7,7,0 + and 10,10,0 + andc 8,8,0 + and 11,11,0 + or 7,7,10 + or 8,8,11 rotldi 6,6,32 rotldi 5,5,32 - addc 7,7,6 - adde 8,8,5 + addc 7,7,6 + adde 8,8,5 rldicl 0,7,32,32 li 10,4 stwbrx 7,0,4 @@ -186,10 +186,10 @@ poly1305_emit: li 12,12 stwbrx 8,11,4 stwbrx 7,12,4 - blr -.long 0 -.byte 0,12,0x14,0,0,0,3,0 + blr +.long 0 +.byte 0,12,0x14,0,0,0,3,0 .size .poly1305_emit,.-.poly1305_emit .size poly1305_emit,.-.poly1305_emit -.byte 80,111,108,121,49,51,48,53,32,102,111,114,32,80,80,67,44,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0 -.align 2 +.byte 80,111,108,121,49,51,48,53,32,102,111,114,32,80,80,67,44,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0 +.align 2 diff --git a/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppcfp.s b/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppcfp.s index ef018b3a1e..481119cc35 100644 --- a/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppcfp.s +++ b/contrib/libs/openssl/asm/ppc64le/crypto/poly1305/poly1305-ppcfp.s @@ -1,500 +1,500 @@ -.machine "any" -.text - -.globl poly1305_init_fpu -.type poly1305_init_fpu,@function +.machine "any" +.text + +.globl poly1305_init_fpu +.type poly1305_init_fpu,@function .section ".opd","aw" .align 3 poly1305_init_fpu: .quad .poly1305_init_fpu,.TOC.@tocbase,0 .previous -.align 6 +.align 6 .poly1305_init_fpu: - stdu 1,-48(1) - mflr 6 - std 6,64(1) - - bl .LPICmeup - - xor 0,0,0 - mtlr 6 - - lfd 8,8*0(5) - lfd 9,8*1(5) - lfd 10,8*2(5) - lfd 11,8*3(5) - lfd 12,8*4(5) - lfd 13,8*5(5) - - stfd 8,8*0(3) - stfd 9,8*1(3) - stfd 10,8*2(3) - stfd 11,8*3(3) - - cmpld 4,0 - beq- .Lno_key - - lfd 6,8*13(5) - mffs 7 - - stfd 8,8*4(3) - stfd 9,8*5(3) - stfd 10,8*6(3) - stfd 11,8*7(3) - - li 8,4 - li 9,8 - li 10,12 + stdu 1,-48(1) + mflr 6 + std 6,64(1) + + bl .LPICmeup + + xor 0,0,0 + mtlr 6 + + lfd 8,8*0(5) + lfd 9,8*1(5) + lfd 10,8*2(5) + lfd 11,8*3(5) + lfd 12,8*4(5) + lfd 13,8*5(5) + + stfd 8,8*0(3) + stfd 9,8*1(3) + stfd 10,8*2(3) + stfd 11,8*3(3) + + cmpld 4,0 + beq- .Lno_key + + lfd 6,8*13(5) + mffs 7 + + stfd 8,8*4(3) + stfd 9,8*5(3) + stfd 10,8*6(3) + stfd 11,8*7(3) + + li 8,4 + li 9,8 + li 10,12 lwbrx 7,0,4 lwbrx 8,8,4 lwbrx 9,9,4 lwbrx 10,10,4 - - lis 11,0xf000 - ori 12,11,3 - andc 7,7,11 - andc 8,8,12 - andc 9,9,12 - andc 10,10,12 - + + lis 11,0xf000 + ori 12,11,3 + andc 7,7,11 + andc 8,8,12 + andc 9,9,12 + andc 10,10,12 + stw 7,36(3) stw 8,44(3) stw 9,52(3) stw 10,60(3) - - mtfsf 255,6 - stfd 8,8*18(3) - stfd 9,8*19(3) - stfd 10,8*20(3) - stfd 11,8*21(3) - stfd 12,8*22(3) - stfd 13,8*23(3) - - lfd 0,8*4(3) - lfd 2,8*5(3) - lfd 4,8*6(3) - lfd 6,8*7(3) - - fsub 0,0,8 - fsub 2,2,9 - fsub 4,4,10 - fsub 6,6,11 - - lfd 8,8*6(5) - lfd 9,8*7(5) - lfd 10,8*8(5) - lfd 11,8*9(5) - - fmul 3,2,13 - fmul 5,4,13 - stfd 7,8*15(3) - fmul 7,6,13 - - fadd 1,0,8 - stfd 3,8*12(3) - fadd 3,2,9 - stfd 5,8*13(3) - fadd 5,4,10 - stfd 7,8*14(3) - fadd 7,6,11 - - fsub 1,1,8 - fsub 3,3,9 - fsub 5,5,10 - fsub 7,7,11 - - lfd 8,8*10(5) - lfd 9,8*11(5) - lfd 10,8*12(5) - - fsub 0,0,1 - fsub 2,2,3 - fsub 4,4,5 - fsub 6,6,7 - - stfd 1,8*5(3) - stfd 3,8*7(3) - stfd 5,8*9(3) - stfd 7,8*11(3) - - stfd 0,8*4(3) - stfd 2,8*6(3) - stfd 4,8*8(3) - stfd 6,8*10(3) - - lfd 2,8*12(3) - lfd 4,8*13(3) - lfd 6,8*14(3) - lfd 0,8*15(3) - - fadd 3,2,8 - fadd 5,4,9 - fadd 7,6,10 - - fsub 3,3,8 - fsub 5,5,9 - fsub 7,7,10 - - fsub 2,2,3 - fsub 4,4,5 - fsub 6,6,7 - - stfd 3,8*13(3) - stfd 5,8*15(3) - stfd 7,8*17(3) - - stfd 2,8*12(3) - stfd 4,8*14(3) - stfd 6,8*16(3) - - mtfsf 255,0 -.Lno_key: - xor 3,3,3 - addi 1,1,48 - blr -.long 0 -.byte 0,12,4,1,0x80,0,2,0 + + mtfsf 255,6 + stfd 8,8*18(3) + stfd 9,8*19(3) + stfd 10,8*20(3) + stfd 11,8*21(3) + stfd 12,8*22(3) + stfd 13,8*23(3) + + lfd 0,8*4(3) + lfd 2,8*5(3) + lfd 4,8*6(3) + lfd 6,8*7(3) + + fsub 0,0,8 + fsub 2,2,9 + fsub 4,4,10 + fsub 6,6,11 + + lfd 8,8*6(5) + lfd 9,8*7(5) + lfd 10,8*8(5) + lfd 11,8*9(5) + + fmul 3,2,13 + fmul 5,4,13 + stfd 7,8*15(3) + fmul 7,6,13 + + fadd 1,0,8 + stfd 3,8*12(3) + fadd 3,2,9 + stfd 5,8*13(3) + fadd 5,4,10 + stfd 7,8*14(3) + fadd 7,6,11 + + fsub 1,1,8 + fsub 3,3,9 + fsub 5,5,10 + fsub 7,7,11 + + lfd 8,8*10(5) + lfd 9,8*11(5) + lfd 10,8*12(5) + + fsub 0,0,1 + fsub 2,2,3 + fsub 4,4,5 + fsub 6,6,7 + + stfd 1,8*5(3) + stfd 3,8*7(3) + stfd 5,8*9(3) + stfd 7,8*11(3) + + stfd 0,8*4(3) + stfd 2,8*6(3) + stfd 4,8*8(3) + stfd 6,8*10(3) + + lfd 2,8*12(3) + lfd 4,8*13(3) + lfd 6,8*14(3) + lfd 0,8*15(3) + + fadd 3,2,8 + fadd 5,4,9 + fadd 7,6,10 + + fsub 3,3,8 + fsub 5,5,9 + fsub 7,7,10 + + fsub 2,2,3 + fsub 4,4,5 + fsub 6,6,7 + + stfd 3,8*13(3) + stfd 5,8*15(3) + stfd 7,8*17(3) + + stfd 2,8*12(3) + stfd 4,8*14(3) + stfd 6,8*16(3) + + mtfsf 255,0 +.Lno_key: + xor 3,3,3 + addi 1,1,48 + blr +.long 0 +.byte 0,12,4,1,0x80,0,2,0 .size .poly1305_init_fpu,.-.poly1305_init_fpu .size poly1305_init_fpu,.-.poly1305_init_fpu - -.globl poly1305_blocks_fpu -.type poly1305_blocks_fpu,@function + +.globl poly1305_blocks_fpu +.type poly1305_blocks_fpu,@function .section ".opd","aw" .align 3 poly1305_blocks_fpu: .quad .poly1305_blocks_fpu,.TOC.@tocbase,0 .previous -.align 4 +.align 4 .poly1305_blocks_fpu: - srwi. 5,5,4 - beq- .Labort - - stdu 1,-240(1) - mflr 0 - stfd 14,96(1) - stfd 15,104(1) - stfd 16,112(1) - stfd 17,120(1) - stfd 18,128(1) - stfd 19,136(1) - stfd 20,144(1) - stfd 21,152(1) - stfd 22,160(1) - stfd 23,168(1) - stfd 24,176(1) - stfd 25,184(1) - stfd 26,192(1) - stfd 27,200(1) - stfd 28,208(1) - stfd 29,216(1) - stfd 30,224(1) - stfd 31,232(1) - std 0,256(1) - - xor 0,0,0 - li 10,1 - mtctr 5 - neg 5,5 + srwi. 5,5,4 + beq- .Labort + + stdu 1,-240(1) + mflr 0 + stfd 14,96(1) + stfd 15,104(1) + stfd 16,112(1) + stfd 17,120(1) + stfd 18,128(1) + stfd 19,136(1) + stfd 20,144(1) + stfd 21,152(1) + stfd 22,160(1) + stfd 23,168(1) + stfd 24,176(1) + stfd 25,184(1) + stfd 26,192(1) + stfd 27,200(1) + stfd 28,208(1) + stfd 29,216(1) + stfd 30,224(1) + stfd 31,232(1) + std 0,256(1) + + xor 0,0,0 + li 10,1 + mtctr 5 + neg 5,5 stw 0,80(1) stw 10,84(1) - - lfd 8,8*18(3) - lfd 9,8*19(3) - lfd 10,8*20(3) - lfd 11,8*21(3) - lfd 12,8*22(3) - lfd 13,8*23(3) - - lfd 0,8*0(3) - lfd 2,8*1(3) - lfd 4,8*2(3) - lfd 6,8*3(3) - - stfd 8,48(1) - oris 10,6,18736 - stfd 9,56(1) - stfd 10,64(1) + + lfd 8,8*18(3) + lfd 9,8*19(3) + lfd 10,8*20(3) + lfd 11,8*21(3) + lfd 12,8*22(3) + lfd 13,8*23(3) + + lfd 0,8*0(3) + lfd 2,8*1(3) + lfd 4,8*2(3) + lfd 6,8*3(3) + + stfd 8,48(1) + oris 10,6,18736 + stfd 9,56(1) + stfd 10,64(1) stw 10,72(1) - - li 11,4 - li 12,8 - li 6,12 + + li 11,4 + li 12,8 + li 6,12 lwbrx 7,0,4 lwbrx 8,11,4 lwbrx 9,12,4 lwbrx 10,6,4 - addi 4,4,16 - + addi 4,4,16 + stw 7,52(1) stw 8,60(1) stw 9,68(1) stw 10,76(1) - - mffs 28 - lfd 29,80(1) - lfd 14,8*4(3) - lfd 15,8*5(3) - lfd 16,8*6(3) - lfd 17,8*7(3) - lfd 18,8*8(3) - lfd 19,8*9(3) - lfd 24,8*10(3) - lfd 25,8*11(3) - lfd 26,8*12(3) - lfd 27,8*13(3) - lfd 20,8*14(3) - lfd 21,8*15(3) - lfd 22,8*16(3) - lfd 23,8*17(3) - - stfd 28,80(1) - mtfsf 255,29 - - addic 5,5,1 - addze 0,0 - slwi. 0,0,4 - sub 4,4,0 - - lfd 28,48(1) - lfd 29,56(1) - lfd 30,64(1) - lfd 31,72(1) - - fsub 0,0,8 + + mffs 28 + lfd 29,80(1) + lfd 14,8*4(3) + lfd 15,8*5(3) + lfd 16,8*6(3) + lfd 17,8*7(3) + lfd 18,8*8(3) + lfd 19,8*9(3) + lfd 24,8*10(3) + lfd 25,8*11(3) + lfd 26,8*12(3) + lfd 27,8*13(3) + lfd 20,8*14(3) + lfd 21,8*15(3) + lfd 22,8*16(3) + lfd 23,8*17(3) + + stfd 28,80(1) + mtfsf 255,29 + + addic 5,5,1 + addze 0,0 + slwi. 0,0,4 + sub 4,4,0 + + lfd 28,48(1) + lfd 29,56(1) + lfd 30,64(1) + lfd 31,72(1) + + fsub 0,0,8 lwbrx 7,0,4 - fsub 2,2,9 + fsub 2,2,9 lwbrx 8,11,4 - fsub 4,4,10 + fsub 4,4,10 lwbrx 9,12,4 - fsub 6,6,11 + fsub 6,6,11 lwbrx 10,6,4 - - fsub 28,28,8 - addi 4,4,16 - fsub 29,29,9 - fsub 30,30,10 - fsub 31,31,11 - - fadd 28,28,0 + + fsub 28,28,8 + addi 4,4,16 + fsub 29,29,9 + fsub 30,30,10 + fsub 31,31,11 + + fadd 28,28,0 stw 7,52(1) - fadd 29,29,2 + fadd 29,29,2 stw 8,60(1) - fadd 30,30,4 + fadd 30,30,4 stw 9,68(1) - fadd 31,31,6 + fadd 31,31,6 stw 10,76(1) - - b .Lentry - -.align 4 -.Loop: - fsub 30,30,8 - addic 5,5,1 - fsub 31,31,9 - addze 0,0 - fsub 26,26,10 - slwi. 0,0,4 - fsub 27,27,11 - sub 4,4,0 - - fadd 0,0,30 - fadd 1,1,31 - fadd 4,4,26 - fadd 5,5,27 - - - fadd 26,2,10 + + b .Lentry + +.align 4 +.Loop: + fsub 30,30,8 + addic 5,5,1 + fsub 31,31,9 + addze 0,0 + fsub 26,26,10 + slwi. 0,0,4 + fsub 27,27,11 + sub 4,4,0 + + fadd 0,0,30 + fadd 1,1,31 + fadd 4,4,26 + fadd 5,5,27 + + + fadd 26,2,10 lwbrx 7,0,4 - fadd 27,3,10 + fadd 27,3,10 lwbrx 8,11,4 - fadd 30,6,12 + fadd 30,6,12 lwbrx 9,12,4 - fadd 31,7,12 + fadd 31,7,12 lwbrx 10,6,4 - fadd 24,0,9 - addi 4,4,16 - fadd 25,1,9 - fadd 28,4,11 - fadd 29,5,11 - - fsub 26,26,10 + fadd 24,0,9 + addi 4,4,16 + fadd 25,1,9 + fadd 28,4,11 + fadd 29,5,11 + + fsub 26,26,10 stw 7,52(1) - fsub 27,27,10 + fsub 27,27,10 stw 8,60(1) - fsub 30,30,12 + fsub 30,30,12 stw 9,68(1) - fsub 31,31,12 + fsub 31,31,12 stw 10,76(1) - fsub 24,24,9 - fsub 25,25,9 - fsub 28,28,11 - fsub 29,29,11 - - fsub 2,2,26 - fsub 3,3,27 - fsub 6,6,30 - fsub 7,7,31 - fsub 4,4,28 - fsub 5,5,29 - fsub 0,0,24 - fsub 1,1,25 - - fadd 2,2,24 - fadd 3,3,25 - fadd 6,6,28 - fadd 7,7,29 - fadd 4,4,26 - fadd 5,5,27 - fmadd 0,30,13,0 - fmadd 1,31,13,1 - - fadd 29,2,3 - lfd 26,8*12(3) - fadd 31,6,7 - lfd 27,8*13(3) - fadd 30,4,5 - lfd 24,8*10(3) - fadd 28,0,1 - lfd 25,8*11(3) -.Lentry: - fmul 0,22,29 - fmul 1,23,29 - fmul 4,16,29 - fmul 5,17,29 - fmul 2,14,29 - fmul 3,15,29 - fmul 6,18,29 - fmul 7,19,29 - - fmadd 0,26,31,0 - fmadd 1,27,31,1 - fmadd 4,22,31,4 - fmadd 5,23,31,5 - fmadd 2,20,31,2 - fmadd 3,21,31,3 - fmadd 6,14,31,6 - fmadd 7,15,31,7 - - fmadd 0,20,30,0 - fmadd 1,21,30,1 - fmadd 4,14,30,4 - fmadd 5,15,30,5 - fmadd 2,22,30,2 - fmadd 3,23,30,3 - fmadd 6,16,30,6 - fmadd 7,17,30,7 - - fmadd 0,14,28,0 - lfd 30,48(1) - fmadd 1,15,28,1 - lfd 31,56(1) - fmadd 4,18,28,4 - lfd 26,64(1) - fmadd 5,19,28,5 - lfd 27,72(1) - fmadd 2,16,28,2 - fmadd 3,17,28,3 - fmadd 6,24,28,6 - fmadd 7,25,28,7 - - bdnz .Loop - - - fadd 24,0,9 - fadd 25,1,9 - fadd 28,4,11 - fadd 29,5,11 - fadd 26,2,10 - fadd 27,3,10 - fadd 30,6,12 - fadd 31,7,12 - - fsub 24,24,9 - fsub 25,25,9 - fsub 28,28,11 - fsub 29,29,11 - fsub 26,26,10 - fsub 27,27,10 - fsub 30,30,12 - fsub 31,31,12 - - fsub 2,2,26 - fsub 3,3,27 - fsub 6,6,30 - fsub 7,7,31 - fsub 4,4,28 - fsub 5,5,29 - fsub 0,0,24 - fsub 1,1,25 - - fadd 2,2,24 - fadd 3,3,25 - fadd 6,6,28 - fadd 7,7,29 - fadd 4,4,26 - fadd 5,5,27 - fmadd 0,30,13,0 - fmadd 1,31,13,1 - - fadd 29,2,3 - fadd 31,6,7 - fadd 30,4,5 - fadd 28,0,1 - - lfd 0,80(1) - fadd 29,29,9 - fadd 31,31,11 - fadd 30,30,10 - fadd 28,28,8 - - stfd 29,8*1(3) - stfd 31,8*3(3) - stfd 30,8*2(3) - stfd 28,8*0(3) - - mtfsf 255,0 - lfd 14,96(1) - lfd 15,104(1) - lfd 16,112(1) - lfd 17,120(1) - lfd 18,128(1) - lfd 19,136(1) - lfd 20,144(1) - lfd 21,152(1) - lfd 22,160(1) - lfd 23,168(1) - lfd 24,176(1) - lfd 25,184(1) - lfd 26,192(1) - lfd 27,200(1) - lfd 28,208(1) - lfd 29,216(1) - lfd 30,224(1) - lfd 31,232(1) - addi 1,1,240 -.Labort: - blr -.long 0 -.byte 0,12,4,1,0x80,0,4,0 + fsub 24,24,9 + fsub 25,25,9 + fsub 28,28,11 + fsub 29,29,11 + + fsub 2,2,26 + fsub 3,3,27 + fsub 6,6,30 + fsub 7,7,31 + fsub 4,4,28 + fsub 5,5,29 + fsub 0,0,24 + fsub 1,1,25 + + fadd 2,2,24 + fadd 3,3,25 + fadd 6,6,28 + fadd 7,7,29 + fadd 4,4,26 + fadd 5,5,27 + fmadd 0,30,13,0 + fmadd 1,31,13,1 + + fadd 29,2,3 + lfd 26,8*12(3) + fadd 31,6,7 + lfd 27,8*13(3) + fadd 30,4,5 + lfd 24,8*10(3) + fadd 28,0,1 + lfd 25,8*11(3) +.Lentry: + fmul 0,22,29 + fmul 1,23,29 + fmul 4,16,29 + fmul 5,17,29 + fmul 2,14,29 + fmul 3,15,29 + fmul 6,18,29 + fmul 7,19,29 + + fmadd 0,26,31,0 + fmadd 1,27,31,1 + fmadd 4,22,31,4 + fmadd 5,23,31,5 + fmadd 2,20,31,2 + fmadd 3,21,31,3 + fmadd 6,14,31,6 + fmadd 7,15,31,7 + + fmadd 0,20,30,0 + fmadd 1,21,30,1 + fmadd 4,14,30,4 + fmadd 5,15,30,5 + fmadd 2,22,30,2 + fmadd 3,23,30,3 + fmadd 6,16,30,6 + fmadd 7,17,30,7 + + fmadd 0,14,28,0 + lfd 30,48(1) + fmadd 1,15,28,1 + lfd 31,56(1) + fmadd 4,18,28,4 + lfd 26,64(1) + fmadd 5,19,28,5 + lfd 27,72(1) + fmadd 2,16,28,2 + fmadd 3,17,28,3 + fmadd 6,24,28,6 + fmadd 7,25,28,7 + + bdnz .Loop + + + fadd 24,0,9 + fadd 25,1,9 + fadd 28,4,11 + fadd 29,5,11 + fadd 26,2,10 + fadd 27,3,10 + fadd 30,6,12 + fadd 31,7,12 + + fsub 24,24,9 + fsub 25,25,9 + fsub 28,28,11 + fsub 29,29,11 + fsub 26,26,10 + fsub 27,27,10 + fsub 30,30,12 + fsub 31,31,12 + + fsub 2,2,26 + fsub 3,3,27 + fsub 6,6,30 + fsub 7,7,31 + fsub 4,4,28 + fsub 5,5,29 + fsub 0,0,24 + fsub 1,1,25 + + fadd 2,2,24 + fadd 3,3,25 + fadd 6,6,28 + fadd 7,7,29 + fadd 4,4,26 + fadd 5,5,27 + fmadd 0,30,13,0 + fmadd 1,31,13,1 + + fadd 29,2,3 + fadd 31,6,7 + fadd 30,4,5 + fadd 28,0,1 + + lfd 0,80(1) + fadd 29,29,9 + fadd 31,31,11 + fadd 30,30,10 + fadd 28,28,8 + + stfd 29,8*1(3) + stfd 31,8*3(3) + stfd 30,8*2(3) + stfd 28,8*0(3) + + mtfsf 255,0 + lfd 14,96(1) + lfd 15,104(1) + lfd 16,112(1) + lfd 17,120(1) + lfd 18,128(1) + lfd 19,136(1) + lfd 20,144(1) + lfd 21,152(1) + lfd 22,160(1) + lfd 23,168(1) + lfd 24,176(1) + lfd 25,184(1) + lfd 26,192(1) + lfd 27,200(1) + lfd 28,208(1) + lfd 29,216(1) + lfd 30,224(1) + lfd 31,232(1) + addi 1,1,240 +.Labort: + blr +.long 0 +.byte 0,12,4,1,0x80,0,4,0 .size .poly1305_blocks_fpu,.-.poly1305_blocks_fpu .size poly1305_blocks_fpu,.-.poly1305_blocks_fpu -.globl poly1305_emit_fpu -.type poly1305_emit_fpu,@function +.globl poly1305_emit_fpu +.type poly1305_emit_fpu,@function .section ".opd","aw" .align 3 poly1305_emit_fpu: .quad .poly1305_emit_fpu,.TOC.@tocbase,0 .previous -.align 4 +.align 4 .poly1305_emit_fpu: - stdu 1,-80(1) - mflr 0 - std 28,48(1) - std 29,56(1) - std 30,64(1) - std 31,72(1) - std 0,96(1) - + stdu 1,-80(1) + mflr 0 + std 28,48(1) + std 29,56(1) + std 30,64(1) + std 31,72(1) + std 0,96(1) + lwz 28,0(3) lwz 7,4(3) lwz 29,8(3) @@ -503,58 +503,58 @@ poly1305_emit_fpu: lwz 9,20(3) lwz 31,24(3) lwz 10,28(3) - - lis 0,0xfff0 - andc 28,28,0 - andc 29,29,0 - andc 30,30,0 - andc 31,31,0 - li 0,3 - - srwi 6,31,2 - and 11,31,0 - andc 31,31,0 - add 31,31,6 - add 7,7,31 - add 8,8,28 - add 9,9,29 - add 10,10,30 - - srdi 28,7,32 - add 8,8,28 - srdi 29,8,32 - add 9,9,29 - srdi 30,9,32 - add 10,10,30 - srdi 31,10,32 - add 11,11,31 - - insrdi 7,8,32,0 - insrdi 9,10,32,0 - - addic 28,7,5 - addze 29,9 - addze 30,11 - - srdi 0,30,2 - neg 0,0 - sradi 0,0,63 - ld 30,0(5) - ld 31,8(5) - - andc 7,7,0 - and 28,28,0 - andc 9,9,0 - and 29,29,0 - or 7,7,28 - or 9,9,29 + + lis 0,0xfff0 + andc 28,28,0 + andc 29,29,0 + andc 30,30,0 + andc 31,31,0 + li 0,3 + + srwi 6,31,2 + and 11,31,0 + andc 31,31,0 + add 31,31,6 + add 7,7,31 + add 8,8,28 + add 9,9,29 + add 10,10,30 + + srdi 28,7,32 + add 8,8,28 + srdi 29,8,32 + add 9,9,29 + srdi 30,9,32 + add 10,10,30 + srdi 31,10,32 + add 11,11,31 + + insrdi 7,8,32,0 + insrdi 9,10,32,0 + + addic 28,7,5 + addze 29,9 + addze 30,11 + + srdi 0,30,2 + neg 0,0 + sradi 0,0,63 + ld 30,0(5) + ld 31,8(5) + + andc 7,7,0 + and 28,28,0 + andc 9,9,0 + and 29,29,0 + or 7,7,28 + or 9,9,29 rotldi 30,30,32 rotldi 31,31,32 - addc 7,7,30 - adde 9,9,31 - - srdi 8,7,32 - srdi 10,9,32 + addc 7,7,30 + adde 9,9,31 + + srdi 8,7,32 + srdi 10,9,32 li 29,4 stwbrx 7,0,4 li 30,8 @@ -562,36 +562,36 @@ poly1305_emit_fpu: li 31,12 stwbrx 9,30,4 stwbrx 10,31,4 - ld 28,48(1) - ld 29,56(1) - ld 30,64(1) - ld 31,72(1) - addi 1,1,80 - blr -.long 0 -.byte 0,12,4,1,0x80,4,3,0 + ld 28,48(1) + ld 29,56(1) + ld 30,64(1) + ld 31,72(1) + addi 1,1,80 + blr +.long 0 +.byte 0,12,4,1,0x80,4,3,0 .size .poly1305_emit_fpu,.-.poly1305_emit_fpu .size poly1305_emit_fpu,.-.poly1305_emit_fpu -.align 6 -.LPICmeup: - mflr 0 - bcl 20,31,$+4 - mflr 5 - addi 5,5,56 - mtlr 0 - blr -.long 0 -.byte 0,12,0x14,0,0,0,0,0 -.space 28 - +.align 6 +.LPICmeup: + mflr 0 + bcl 20,31,$+4 + mflr 5 + addi 5,5,56 + mtlr 0 + blr +.long 0 +.byte 0,12,0x14,0,0,0,0,0 +.space 28 + .long 0x43300000,0x00000000 .long 0x45300000,0x00000000 .long 0x47300000,0x00000000 .long 0x49300000,0x00000000 .long 0x4b500000,0x00000000 - + .long 0x37f40000,0x00000000 - + .long 0x44300000,0x00000000 .long 0x46300000,0x00000000 .long 0x48300000,0x00000000 @@ -599,8 +599,8 @@ poly1305_emit_fpu: .long 0x3e300000,0x00000000 .long 0x40300000,0x00000000 .long 0x42300000,0x00000000 - + .long 0x00000000,0x00000001 -.byte 80,111,108,121,49,51,48,53,32,102,111,114,32,80,80,67,32,70,80,85,44,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0 -.align 2 -.align 4 +.byte 80,111,108,121,49,51,48,53,32,102,111,114,32,80,80,67,32,70,80,85,44,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0 +.align 2 +.align 4 |