Skip to content

Commit 8b94671

Browse files
committed
Update generated-src
1 parent 496470a commit 8b94671

File tree

3 files changed

+134
-176
lines changed

3 files changed

+134
-176
lines changed

generated-src/linux-x86/crypto/chacha/chacha-x86.S

Lines changed: 48 additions & 60 deletions
Original file line number | Diff line number | Diff line change
@@ -5,29 +5,16 @@
55

66
#if !defined(OPENSSL_NO_ASM) && defined(OPENSSL_X86) && defined(__ELF__)
77
.text
8-
.globl ChaCha20_ctr32
9-
.hidden ChaCha20_ctr32
10-
.type ChaCha20_ctr32,@function
8+
.globl ChaCha20_ctr32_nohw
9+
.hidden ChaCha20_ctr32_nohw
10+
.type ChaCha20_ctr32_nohw,@function
1111
.align 16
12-
ChaCha20_ctr32:
13-
.L_ChaCha20_ctr32_begin:
12+
ChaCha20_ctr32_nohw:
13+
.L_ChaCha20_ctr32_nohw_begin:
1414
pushl %ebp
1515
pushl %ebx
1616
pushl %esi
1717
pushl %edi
18-
xorl %eax,%eax
19-
cmpl 28(%esp),%eax
20-
je .L000no_data
21-
call .Lpic_point
22-
.Lpic_point:
23-
popl %eax
24-
leal OPENSSL_ia32cap_P-.Lpic_point(%eax),%ebp
25-
testl $16777216,(%ebp)
26-
jz .L001x86
27-
testl $512,4(%ebp)
28-
jz .L001x86
29-
jmp .Lssse3_shortcut
30-
.L001x86:
3118
movl 32(%esp),%esi
3219
movl 36(%esp),%edi
3320
subl $132,%esp
@@ -56,13 +43,13 @@ ChaCha20_ctr32:
5643
movl %ebx,116(%esp)
5744
movl %ecx,120(%esp)
5845
movl %edx,124(%esp)
59-
jmp .L002entry
46+
jmp .L000entry
6047
.align 16
61-
.L003outer_loop:
48+
.L001outer_loop:
6249
movl %ebx,156(%esp)
6350
movl %eax,152(%esp)
6451
movl %ecx,160(%esp)
65-
.L002entry:
52+
.L000entry:
6653
movl $1634760805,%eax
6754
movl $857760878,4(%esp)
6855
movl $2036477234,8(%esp)
@@ -90,9 +77,9 @@ ChaCha20_ctr32:
9077
movl %edi,60(%esp)
9178
movl %edx,112(%esp)
9279
movl $10,%ebx
93-
jmp .L004loop
80+
jmp .L002loop
9481
.align 16
95-
.L004loop:
82+
.L002loop:
9683
addl %ebp,%eax
9784
movl %ebx,128(%esp)
9885
movl %ebp,%ebx
@@ -246,14 +233,14 @@ ChaCha20_ctr32:
246233
xorl %esi,%ebp
247234
roll $7,%ebp
248235
decl %ebx
249-
jnz .L004loop
236+
jnz .L002loop
250237
movl 160(%esp),%ebx
251238
addl $1634760805,%eax
252239
addl 80(%esp),%ebp
253240
addl 96(%esp),%ecx
254241
addl 100(%esp),%esi
255242
cmpl $64,%ebx
256-
jb .L005tail
243+
jb .L003tail
257244
movl 156(%esp),%ebx
258245
addl 112(%esp),%edx
259246
addl 120(%esp),%edi
@@ -316,9 +303,9 @@ ChaCha20_ctr32:
316303
movl %ebp,(%eax)
317304
leal 64(%eax),%eax
318305
subl $64,%ecx
319-
jnz .L003outer_loop
320-
jmp .L006done
321-
.L005tail:
306+
jnz .L001outer_loop
307+
jmp .L004done
308+
.L003tail:
322309
addl 112(%esp),%edx
323310
addl 120(%esp),%edi
324311
movl %eax,(%esp)
@@ -362,34 +349,35 @@ ChaCha20_ctr32:
362349
movl %edi,60(%esp)
363350
xorl %eax,%eax
364351
xorl %edx,%edx
365-
.L007tail_loop:
352+
.L005tail_loop:
366353
movb (%esi,%ebp,1),%al
367354
movb (%esp,%esi,1),%dl
368355
leal 1(%esi),%esi
369356
xorb %dl,%al
370357
movb %al,-1(%ecx,%esi,1)
371358
decl %ebx
372-
jnz .L007tail_loop
373-
.L006done:
359+
jnz .L005tail_loop
360+
.L004done:
374361
addl $132,%esp
375-
.L000no_data:
376362
popl %edi
377363
popl %esi
378364
popl %ebx
379365
popl %ebp
380366
ret
381-
.size ChaCha20_ctr32,.-.L_ChaCha20_ctr32_begin
382-
.globl ChaCha20_ssse3
383-
.hidden ChaCha20_ssse3
384-
.type ChaCha20_ssse3,@function
367+
.size ChaCha20_ctr32_nohw,.-.L_ChaCha20_ctr32_nohw_begin
368+
.globl ChaCha20_ctr32_ssse3
369+
.hidden ChaCha20_ctr32_ssse3
370+
.type ChaCha20_ctr32_ssse3,@function
385371
.align 16
386-
ChaCha20_ssse3:
387-
.L_ChaCha20_ssse3_begin:
372+
ChaCha20_ctr32_ssse3:
373+
.L_ChaCha20_ctr32_ssse3_begin:
388374
pushl %ebp
389375
pushl %ebx
390376
pushl %esi
391377
pushl %edi
392-
.Lssse3_shortcut:
378+
call .Lpic_point
379+
.Lpic_point:
380+
popl %eax
393381
movl 20(%esp),%edi
394382
movl 24(%esp),%esi
395383
movl 28(%esp),%ecx
@@ -402,7 +390,7 @@ ChaCha20_ssse3:
402390
leal .Lssse3_data-.Lpic_point(%eax),%eax
403391
movdqu (%ebx),%xmm3
404392
cmpl $256,%ecx
405-
jb .L0081x
393+
jb .L0061x
406394
movl %edx,516(%esp)
407395
movl %ebx,520(%esp)
408396
subl $256,%ecx
@@ -447,9 +435,9 @@ ChaCha20_ssse3:
447435
movdqa %xmm7,-80(%ebp)
448436
leal 128(%esi),%esi
449437
leal 128(%edi),%edi
450-
jmp .L009outer_loop
438+
jmp .L007outer_loop
451439
.align 16
452-
.L009outer_loop:
440+
.L007outer_loop:
453441
movdqa -112(%ebp),%xmm1
454442
movdqa -96(%ebp),%xmm2
455443
movdqa -80(%ebp),%xmm3
@@ -484,7 +472,7 @@ ChaCha20_ssse3:
484472
movl $10,%edx
485473
nop
486474
.align 16
487-
.L010loop:
475+
.L008loop:
488476
paddd %xmm3,%xmm0
489477
movdqa %xmm3,%xmm2
490478
pxor %xmm0,%xmm6
@@ -684,7 +672,7 @@ ChaCha20_ssse3:
684672
psrld $25,%xmm1
685673
por %xmm1,%xmm3
686674
decl %edx
687-
jnz .L010loop
675+
jnz .L008loop
688676
movdqa %xmm3,-64(%ebx)
689677
movdqa %xmm4,(%ebx)
690678
movdqa %xmm5,16(%ebx)
@@ -826,9 +814,9 @@ ChaCha20_ssse3:
826814
movdqu %xmm7,64(%edi)
827815
leal 208(%edi),%edi
828816
subl $256,%ecx
829-
jnc .L009outer_loop
817+
jnc .L007outer_loop
830818
addl $256,%ecx
831-
jz .L011done
819+
jz .L009done
832820
movl 520(%esp),%ebx
833821
leal -128(%esi),%esi
834822
movl 516(%esp),%edx
@@ -838,7 +826,7 @@ ChaCha20_ssse3:
838826
paddd 96(%eax),%xmm2
839827
pand 112(%eax),%xmm3
840828
por %xmm2,%xmm3
841-
.L0081x:
829+
.L0061x:
842830
movdqa 32(%eax),%xmm0
843831
movdqu (%edx),%xmm1
844832
movdqu 16(%edx),%xmm2
@@ -850,19 +838,19 @@ ChaCha20_ssse3:
850838
movdqa %xmm2,32(%esp)
851839
movdqa %xmm3,48(%esp)
852840
movl $10,%edx
853-
jmp .L012loop1x
841+
jmp .L010loop1x
854842
.align 16
855-
.L013outer1x:
843+
.L011outer1x:
856844
movdqa 80(%eax),%xmm3
857845
movdqa (%esp),%xmm0
858846
movdqa 16(%esp),%xmm1
859847
movdqa 32(%esp),%xmm2
860848
paddd 48(%esp),%xmm3
861849
movl $10,%edx
862850
movdqa %xmm3,48(%esp)
863-
jmp .L012loop1x
851+
jmp .L010loop1x
864852
.align 16
865-
.L012loop1x:
853+
.L010loop1x:
866854
paddd %xmm1,%xmm0
867855
pxor %xmm0,%xmm3
868856
.byte 102,15,56,0,222
@@ -907,13 +895,13 @@ ChaCha20_ssse3:
907895
pshufd $147,%xmm1,%xmm1
908896
pshufd $57,%xmm3,%xmm3
909897
decl %edx
910-
jnz .L012loop1x
898+
jnz .L010loop1x
911899
paddd (%esp),%xmm0
912900
paddd 16(%esp),%xmm1
913901
paddd 32(%esp),%xmm2
914902
paddd 48(%esp),%xmm3
915903
cmpl $64,%ecx
916-
jb .L014tail
904+
jb .L012tail
917905
movdqu (%esi),%xmm4
918906
movdqu 16(%esi),%xmm5
919907
pxor %xmm4,%xmm0
@@ -929,32 +917,32 @@ ChaCha20_ssse3:
929917
movdqu %xmm3,48(%edi)
930918
leal 64(%edi),%edi
931919
subl $64,%ecx
932-
jnz .L013outer1x
933-
jmp .L011done
934-
.L014tail:
920+
jnz .L011outer1x
921+
jmp .L009done
922+
.L012tail:
935923
movdqa %xmm0,(%esp)
936924
movdqa %xmm1,16(%esp)
937925
movdqa %xmm2,32(%esp)
938926
movdqa %xmm3,48(%esp)
939927
xorl %eax,%eax
940928
xorl %edx,%edx
941929
xorl %ebp,%ebp
942-
.L015tail_loop:
930+
.L013tail_loop:
943931
movb (%esp,%ebp,1),%al
944932
movb (%esi,%ebp,1),%dl
945933
leal 1(%ebp),%ebp
946934
xorb %dl,%al
947935
movb %al,-1(%edi,%ebp,1)
948936
decl %ecx
949-
jnz .L015tail_loop
950-
.L011done:
937+
jnz .L013tail_loop
938+
.L009done:
951939
movl 512(%esp),%esp
952940
popl %edi
953941
popl %esi
954942
popl %ebx
955943
popl %ebp
956944
ret
957-
.size ChaCha20_ssse3,.-.L_ChaCha20_ssse3_begin
945+
.size ChaCha20_ctr32_ssse3,.-.L_ChaCha20_ctr32_ssse3_begin
958946
.align 64
959947
.Lssse3_data:
960948
.byte 2,3,0,1,6,7,4,5,10,11,8,9,14,15,12,13

0 commit comments

Comments
 (0)