aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorDenys Vlasenko <vda.linux@googlemail.com>2023-03-29 15:44:08 +0200
committerDenys Vlasenko <vda.linux@googlemail.com>2023-03-29 15:46:32 +0200
commita59e5a7d08cb26ec029d00dd11e693765aca17be (patch)
tree8b2dc901386a888d15ee8a70d148586022ae67e4
parentbd76b75f72f717150b909e8c64edfda725cabe11 (diff)
downloadbusybox-w32-a59e5a7d08cb26ec029d00dd11e693765aca17be.tar.gz
busybox-w32-a59e5a7d08cb26ec029d00dd11e693765aca17be.tar.bz2
busybox-w32-a59e5a7d08cb26ec029d00dd11e693765aca17be.zip
libbb/sha: do not read shaNI variable twice, and factor out its setting
My gcc inlines both calls, so instead of "-20 bytes" I get only this: function old new delta sha256_begin 84 83 -1 sha1_begin 114 111 -3 ------------------------------------------------------------------------------ (add/remove: 0/0 grow/shrink: 0/2 up/down: 0/-4) Total: -4 bytes Signed-off-by: Denys Vlasenko <vda.linux@googlemail.com>
-rw-r--r--libbb/hash_md5_sha.c28
1 files changed, 16 insertions, 12 deletions
diff --git a/libbb/hash_md5_sha.c b/libbb/hash_md5_sha.c
index bbe58c77b..88baf51dc 100644
--- a/libbb/hash_md5_sha.c
+++ b/libbb/hash_md5_sha.c
@@ -23,6 +23,14 @@ static void cpuid(unsigned *eax, unsigned *ebx, unsigned *ecx, unsigned *edx)
23 ); 23 );
24} 24}
25static smallint shaNI; 25static smallint shaNI;
26static int get_shaNI(void)
27{
28 unsigned eax = 7, ebx = ebx, ecx = 0, edx = edx;
29 cpuid(&eax, &ebx, &ecx, &edx);
30 ebx = ((ebx >> 28) & 2) - 1; /* bit 29 -> 1 or -1 */
31 shaNI = (int)ebx;
32 return (int)ebx;
33}
26void FAST_FUNC sha1_process_block64_shaNI(sha1_ctx_t *ctx); 34void FAST_FUNC sha1_process_block64_shaNI(sha1_ctx_t *ctx);
27void FAST_FUNC sha256_process_block64_shaNI(sha256_ctx_t *ctx); 35void FAST_FUNC sha256_process_block64_shaNI(sha256_ctx_t *ctx);
28# if defined(__i386__) 36# if defined(__i386__)
@@ -1175,12 +1183,10 @@ void FAST_FUNC sha1_begin(sha1_ctx_t *ctx)
1175#if ENABLE_SHA1_HWACCEL 1183#if ENABLE_SHA1_HWACCEL
1176# if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) 1184# if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__))
1177 { 1185 {
1178 if (!shaNI) { 1186 int ni = shaNI;
1179 unsigned eax = 7, ebx = ebx, ecx = 0, edx = edx; 1187 if (!ni)
1180 cpuid(&eax, &ebx, &ecx, &edx); 1188 ni = get_shaNI();
1181 shaNI = ((ebx >> 28) & 2) - 1; /* bit 29 -> 1 or -1 */ 1189 if (ni > 0)
1182 }
1183 if (shaNI > 0)
1184 ctx->process_block = sha1_process_block64_shaNI; 1190 ctx->process_block = sha1_process_block64_shaNI;
1185 } 1191 }
1186# endif 1192# endif
@@ -1229,12 +1235,10 @@ void FAST_FUNC sha256_begin(sha256_ctx_t *ctx)
1229#if ENABLE_SHA256_HWACCEL 1235#if ENABLE_SHA256_HWACCEL
1230# if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__)) 1236# if defined(__GNUC__) && (defined(__i386__) || defined(__x86_64__))
1231 { 1237 {
1232 if (!shaNI) { 1238 int ni = shaNI;
1233 unsigned eax = 7, ebx = ebx, ecx = 0, edx = edx; 1239 if (!ni)
1234 cpuid(&eax, &ebx, &ecx, &edx); 1240 ni = get_shaNI();
1235 shaNI = ((ebx >> 28) & 2) - 1; /* bit 29 -> 1 or -1 */ 1241 if (ni > 0)
1236 }
1237 if (shaNI > 0)
1238 ctx->process_block = sha256_process_block64_shaNI; 1242 ctx->process_block = sha256_process_block64_shaNI;
1239 } 1243 }
1240# endif 1244# endif