Loading
crypto/aes/asm/bsaes-x86_64.pl +2 −0
Original line number Diff line number Diff line
Loading
@@ -40,6 +40,7 @@
 # Core 2 9.30 8.69 +7%
 # Nehalem(**) 7.63 6.88 +11%
 # Atom 17.1 16.4 +4%
+# Silvermont - 12.9
 #
 # (*) Comparison is not completely fair, because "this" is ECB,
 # i.e. no extra processing such as counter values calculation
Loading
Loading
@@ -78,6 +79,7 @@
 # Core 2 9.98
 # Nehalem 7.80
 # Atom 17.9
+# Silvermont 14.0
 #
 # November 2011.
 #
Loading
crypto/aes/asm/vpaes-x86.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -30,6 +30,7 @@
 # Core 2(**) 28.1/41.4/18.3 21.9/25.2(***)
 # Nehalem 27.9/40.4/18.1 10.2/11.9
 # Atom 70.7/92.1/60.1 61.1/75.4(***)
+# Silvermont 45.4/62.9/24.1 49.2/61.1(***)
 #
 # (*) "Hyper-threading" in the context refers rather to cache shared
 # among multiple cores, than to specifically Intel HTT. As vast
Loading
crypto/aes/asm/vpaes-x86_64.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -30,6 +30,7 @@
 # Core 2(**) 29.6/41.1/14.3 21.9/25.2(***)
 # Nehalem 29.6/40.3/14.6 10.0/11.8
 # Atom 57.3/74.2/32.1 60.9/77.2(***)
+# Silvermont 52.7/64.0/19.5 48.8/60.8(***)
 #
 # (*) "Hyper-threading" in the context refers rather to cache shared
 # among multiple cores, than to specifically Intel HTT. As vast
Loading
crypto/modes/asm/ghash-x86_64.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -64,6 +64,7 @@
 # Ivy Bridge 1.80(+7%)
 # Haswell 0.55(+93%) (if system doesn't support AVX)
 # Bulldozer 1.49(+27%)
+# Silvermont 2.88(+13%)
 
 # March 2013
 #
Loading
crypto/sha/asm/sha1-586.pl +5 −2
Original line number Diff line number Diff line
Loading
@@ -93,16 +93,19 @@
 # P4 10.6 -
 # AMD K8 7.1 -
 # Core2 7.3 6.0/+22% -
-# Atom 12.5 9.3(*)/+35% -
 # Westmere 7.3 5.5/+33% -
 # Sandy Bridge 8.8 6.2/+40% 5.1(**)/+73%
 # Ivy Bridge 7.2 4.8/+51% 4.7(**)/+53%
 # Haswell 6.5 4.3/+51% 4.1(**)/+58%
 # Bulldozer 11.6 6.0/+92%
 # VIA Nano 10.6 7.5/+41%
+# Atom 12.5 9.3(*)/+35%
+# Silvermont 14.5 9.9(*)/+46%
 #
 # (*) Loop is 1056 instructions long and expected result is ~8.25.
-# It remains mystery [to me] why ILP is limited to 1.7.
+# The discrepancy is because of front-end limitations, so
+# called MS-ROM penalties, and on Silvermont even rotate's
+# limited parallelism.
 #
 # (**) As per above comment, the result is for AVX *plus* sh[rl]d.
 
Loading
Loading
crypto/aes/asm/bsaes-x86_64.pl +2 −0
Original line number Diff line number Diff line
Loading
@@ -40,6 +40,7 @@
 # Core 2 9.30 8.69 +7%
 # Nehalem(**) 7.63 6.88 +11%
 # Atom 17.1 16.4 +4%
+# Silvermont - 12.9
 #
 # (*) Comparison is not completely fair, because "this" is ECB,
 # i.e. no extra processing such as counter values calculation
Loading
Loading
@@ -78,6 +79,7 @@
 # Core 2 9.98
 # Nehalem 7.80
 # Atom 17.9
+# Silvermont 14.0
 #
 # November 2011.
 #
Loading
crypto/aes/asm/vpaes-x86.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -30,6 +30,7 @@
 # Core 2(**) 28.1/41.4/18.3 21.9/25.2(***)
 # Nehalem 27.9/40.4/18.1 10.2/11.9
 # Atom 70.7/92.1/60.1 61.1/75.4(***)
+# Silvermont 45.4/62.9/24.1 49.2/61.1(***)
 #
 # (*) "Hyper-threading" in the context refers rather to cache shared
 # among multiple cores, than to specifically Intel HTT. As vast
Loading
crypto/aes/asm/vpaes-x86_64.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -30,6 +30,7 @@
 # Core 2(**) 29.6/41.1/14.3 21.9/25.2(***)
 # Nehalem 29.6/40.3/14.6 10.0/11.8
 # Atom 57.3/74.2/32.1 60.9/77.2(***)
+# Silvermont 52.7/64.0/19.5 48.8/60.8(***)
 #
 # (*) "Hyper-threading" in the context refers rather to cache shared
 # among multiple cores, than to specifically Intel HTT. As vast
Loading
crypto/modes/asm/ghash-x86_64.pl +1 −0
Original line number Diff line number Diff line
Loading
@@ -64,6 +64,7 @@
 # Ivy Bridge 1.80(+7%)
 # Haswell 0.55(+93%) (if system doesn't support AVX)
 # Bulldozer 1.49(+27%)
+# Silvermont 2.88(+13%)
 
 # March 2013
 #
Loading
crypto/sha/asm/sha1-586.pl +5 −2
Original line number Diff line number Diff line
Loading
@@ -93,16 +93,19 @@
 # P4 10.6 -
 # AMD K8 7.1 -
 # Core2 7.3 6.0/+22% -
-# Atom 12.5 9.3(*)/+35% -
 # Westmere 7.3 5.5/+33% -
 # Sandy Bridge 8.8 6.2/+40% 5.1(**)/+73%
 # Ivy Bridge 7.2 4.8/+51% 4.7(**)/+53%
 # Haswell 6.5 4.3/+51% 4.1(**)/+58%
 # Bulldozer 11.6 6.0/+92%
 # VIA Nano 10.6 7.5/+41%
+# Atom 12.5 9.3(*)/+35%
+# Silvermont 14.5 9.9(*)/+46%
 #
 # (*) Loop is 1056 instructions long and expected result is ~8.25.
-# It remains mystery [to me] why ILP is limited to 1.7.
+# The discrepancy is because of front-end limitations, so
+# called MS-ROM penalties, and on Silvermont even rotate's
+# limited parallelism.
 #
 # (**) As per above comment, the result is for AVX *plus* sh[rl]d.
 
Loading