diff options
Diffstat (limited to 'C/CpuArch.h')
-rw-r--r-- | C/CpuArch.h | 218 |
1 files changed, 148 insertions, 70 deletions
diff --git a/C/CpuArch.h b/C/CpuArch.h index 4856fbb..8e5d8a5 100644 --- a/C/CpuArch.h +++ b/C/CpuArch.h | |||
@@ -1,8 +1,8 @@ | |||
1 | /* CpuArch.h -- CPU specific code | 1 | /* CpuArch.h -- CPU specific code |
2 | 2022-07-15 : Igor Pavlov : Public domain */ | 2 | 2023-04-02 : Igor Pavlov : Public domain */ |
3 | 3 | ||
4 | #ifndef __CPU_ARCH_H | 4 | #ifndef ZIP7_INC_CPU_ARCH_H |
5 | #define __CPU_ARCH_H | 5 | #define ZIP7_INC_CPU_ARCH_H |
6 | 6 | ||
7 | #include "7zTypes.h" | 7 | #include "7zTypes.h" |
8 | 8 | ||
@@ -51,7 +51,13 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
51 | || defined(__AARCH64EB__) \ | 51 | || defined(__AARCH64EB__) \ |
52 | || defined(__aarch64__) | 52 | || defined(__aarch64__) |
53 | #define MY_CPU_ARM64 | 53 | #define MY_CPU_ARM64 |
54 | #define MY_CPU_NAME "arm64" | 54 | #ifdef __ILP32__ |
55 | #define MY_CPU_NAME "arm64-32" | ||
56 | #define MY_CPU_SIZEOF_POINTER 4 | ||
57 | #else | ||
58 | #define MY_CPU_NAME "arm64" | ||
59 | #define MY_CPU_SIZEOF_POINTER 8 | ||
60 | #endif | ||
55 | #define MY_CPU_64BIT | 61 | #define MY_CPU_64BIT |
56 | #endif | 62 | #endif |
57 | 63 | ||
@@ -68,8 +74,10 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
68 | #define MY_CPU_ARM | 74 | #define MY_CPU_ARM |
69 | 75 | ||
70 | #if defined(__thumb__) || defined(__THUMBEL__) || defined(_M_ARMT) | 76 | #if defined(__thumb__) || defined(__THUMBEL__) || defined(_M_ARMT) |
77 | #define MY_CPU_ARMT | ||
71 | #define MY_CPU_NAME "armt" | 78 | #define MY_CPU_NAME "armt" |
72 | #else | 79 | #else |
80 | #define MY_CPU_ARM32 | ||
73 | #define MY_CPU_NAME "arm" | 81 | #define MY_CPU_NAME "arm" |
74 | #endif | 82 | #endif |
75 | /* #define MY_CPU_32BIT */ | 83 | /* #define MY_CPU_32BIT */ |
@@ -103,6 +111,8 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
103 | || defined(__PPC__) \ | 111 | || defined(__PPC__) \ |
104 | || defined(_POWER) | 112 | || defined(_POWER) |
105 | 113 | ||
114 | #define MY_CPU_PPC_OR_PPC64 | ||
115 | |||
106 | #if defined(__ppc64__) \ | 116 | #if defined(__ppc64__) \ |
107 | || defined(__powerpc64__) \ | 117 | || defined(__powerpc64__) \ |
108 | || defined(_LP64) \ | 118 | || defined(_LP64) \ |
@@ -197,6 +207,9 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
197 | #error Stop_Compiling_Bad_Endian | 207 | #error Stop_Compiling_Bad_Endian |
198 | #endif | 208 | #endif |
199 | 209 | ||
210 | #if !defined(MY_CPU_LE) && !defined(MY_CPU_BE) | ||
211 | #error Stop_Compiling_CPU_ENDIAN_must_be_detected_at_compile_time | ||
212 | #endif | ||
200 | 213 | ||
201 | #if defined(MY_CPU_32BIT) && defined(MY_CPU_64BIT) | 214 | #if defined(MY_CPU_32BIT) && defined(MY_CPU_64BIT) |
202 | #error Stop_Compiling_Bad_32_64_BIT | 215 | #error Stop_Compiling_Bad_32_64_BIT |
@@ -253,6 +266,67 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
253 | 266 | ||
254 | 267 | ||
255 | 268 | ||
269 | #ifdef __has_builtin | ||
270 | #define Z7_has_builtin(x) __has_builtin(x) | ||
271 | #else | ||
272 | #define Z7_has_builtin(x) 0 | ||
273 | #endif | ||
274 | |||
275 | |||
276 | #define Z7_BSWAP32_CONST(v) \ | ||
277 | ( (((UInt32)(v) << 24) ) \ | ||
278 | | (((UInt32)(v) << 8) & (UInt32)0xff0000) \ | ||
279 | | (((UInt32)(v) >> 8) & (UInt32)0xff00 ) \ | ||
280 | | (((UInt32)(v) >> 24) )) | ||
281 | |||
282 | |||
283 | #if defined(_MSC_VER) && (_MSC_VER >= 1300) | ||
284 | |||
285 | #include <stdlib.h> | ||
286 | |||
287 | /* Note: these macros will use bswap instruction (486), that is unsupported in 386 cpu */ | ||
288 | |||
289 | #pragma intrinsic(_byteswap_ushort) | ||
290 | #pragma intrinsic(_byteswap_ulong) | ||
291 | #pragma intrinsic(_byteswap_uint64) | ||
292 | |||
293 | #define Z7_BSWAP16(v) _byteswap_ushort(v) | ||
294 | #define Z7_BSWAP32(v) _byteswap_ulong (v) | ||
295 | #define Z7_BSWAP64(v) _byteswap_uint64(v) | ||
296 | #define Z7_CPU_FAST_BSWAP_SUPPORTED | ||
297 | |||
298 | #elif (defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3))) \ | ||
299 | || (defined(__clang__) && Z7_has_builtin(__builtin_bswap16)) | ||
300 | |||
301 | #define Z7_BSWAP16(v) __builtin_bswap16(v) | ||
302 | #define Z7_BSWAP32(v) __builtin_bswap32(v) | ||
303 | #define Z7_BSWAP64(v) __builtin_bswap64(v) | ||
304 | #define Z7_CPU_FAST_BSWAP_SUPPORTED | ||
305 | |||
306 | #else | ||
307 | |||
308 | #define Z7_BSWAP16(v) ((UInt16) \ | ||
309 | ( ((UInt32)(v) << 8) \ | ||
310 | | ((UInt32)(v) >> 8) \ | ||
311 | )) | ||
312 | |||
313 | #define Z7_BSWAP32(v) Z7_BSWAP32_CONST(v) | ||
314 | |||
315 | #define Z7_BSWAP64(v) \ | ||
316 | ( ( ( (UInt64)(v) ) << 8 * 7 ) \ | ||
317 | | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 1) ) << 8 * 5 ) \ | ||
318 | | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 2) ) << 8 * 3 ) \ | ||
319 | | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 3) ) << 8 * 1 ) \ | ||
320 | | ( ( (UInt64)(v) >> 8 * 1 ) & ((UInt32)0xff << 8 * 3) ) \ | ||
321 | | ( ( (UInt64)(v) >> 8 * 3 ) & ((UInt32)0xff << 8 * 2) ) \ | ||
322 | | ( ( (UInt64)(v) >> 8 * 5 ) & ((UInt32)0xff << 8 * 1) ) \ | ||
323 | | ( ( (UInt64)(v) >> 8 * 7 ) ) \ | ||
324 | ) | ||
325 | |||
326 | #endif | ||
327 | |||
328 | |||
329 | |||
256 | #ifdef MY_CPU_LE | 330 | #ifdef MY_CPU_LE |
257 | #if defined(MY_CPU_X86_OR_AMD64) \ | 331 | #if defined(MY_CPU_X86_OR_AMD64) \ |
258 | || defined(MY_CPU_ARM64) | 332 | || defined(MY_CPU_ARM64) |
@@ -272,13 +346,11 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
272 | #define GetUi32(p) (*(const UInt32 *)(const void *)(p)) | 346 | #define GetUi32(p) (*(const UInt32 *)(const void *)(p)) |
273 | #ifdef MY_CPU_LE_UNALIGN_64 | 347 | #ifdef MY_CPU_LE_UNALIGN_64 |
274 | #define GetUi64(p) (*(const UInt64 *)(const void *)(p)) | 348 | #define GetUi64(p) (*(const UInt64 *)(const void *)(p)) |
349 | #define SetUi64(p, v) { *(UInt64 *)(void *)(p) = (v); } | ||
275 | #endif | 350 | #endif |
276 | 351 | ||
277 | #define SetUi16(p, v) { *(UInt16 *)(void *)(p) = (v); } | 352 | #define SetUi16(p, v) { *(UInt16 *)(void *)(p) = (v); } |
278 | #define SetUi32(p, v) { *(UInt32 *)(void *)(p) = (v); } | 353 | #define SetUi32(p, v) { *(UInt32 *)(void *)(p) = (v); } |
279 | #ifdef MY_CPU_LE_UNALIGN_64 | ||
280 | #define SetUi64(p, v) { *(UInt64 *)(void *)(p) = (v); } | ||
281 | #endif | ||
282 | 354 | ||
283 | #else | 355 | #else |
284 | 356 | ||
@@ -305,51 +377,26 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
305 | #endif | 377 | #endif |
306 | 378 | ||
307 | 379 | ||
308 | #ifndef MY_CPU_LE_UNALIGN_64 | 380 | #ifndef GetUi64 |
309 | |||
310 | #define GetUi64(p) (GetUi32(p) | ((UInt64)GetUi32(((const Byte *)(p)) + 4) << 32)) | 381 | #define GetUi64(p) (GetUi32(p) | ((UInt64)GetUi32(((const Byte *)(p)) + 4) << 32)) |
382 | #endif | ||
311 | 383 | ||
384 | #ifndef SetUi64 | ||
312 | #define SetUi64(p, v) { Byte *_ppp2_ = (Byte *)(p); UInt64 _vvv2_ = (v); \ | 385 | #define SetUi64(p, v) { Byte *_ppp2_ = (Byte *)(p); UInt64 _vvv2_ = (v); \ |
313 | SetUi32(_ppp2_ , (UInt32)_vvv2_); \ | 386 | SetUi32(_ppp2_ , (UInt32)_vvv2_) \ |
314 | SetUi32(_ppp2_ + 4, (UInt32)(_vvv2_ >> 32)); } | 387 | SetUi32(_ppp2_ + 4, (UInt32)(_vvv2_ >> 32)) } |
315 | |||
316 | #endif | 388 | #endif |
317 | 389 | ||
318 | 390 | ||
391 | #if defined(MY_CPU_LE_UNALIGN) && defined(Z7_CPU_FAST_BSWAP_SUPPORTED) | ||
319 | 392 | ||
393 | #define GetBe32(p) Z7_BSWAP32 (*(const UInt32 *)(const void *)(p)) | ||
394 | #define SetBe32(p, v) { (*(UInt32 *)(void *)(p)) = Z7_BSWAP32(v); } | ||
320 | 395 | ||
321 | #ifdef __has_builtin | 396 | #if defined(MY_CPU_LE_UNALIGN_64) |
322 | #define MY__has_builtin(x) __has_builtin(x) | 397 | #define GetBe64(p) Z7_BSWAP64 (*(const UInt64 *)(const void *)(p)) |
323 | #else | ||
324 | #define MY__has_builtin(x) 0 | ||
325 | #endif | 398 | #endif |
326 | 399 | ||
327 | #if defined(MY_CPU_LE_UNALIGN) && /* defined(_WIN64) && */ defined(_MSC_VER) && (_MSC_VER >= 1300) | ||
328 | |||
329 | /* Note: we use bswap instruction, that is unsupported in 386 cpu */ | ||
330 | |||
331 | #include <stdlib.h> | ||
332 | |||
333 | #pragma intrinsic(_byteswap_ushort) | ||
334 | #pragma intrinsic(_byteswap_ulong) | ||
335 | #pragma intrinsic(_byteswap_uint64) | ||
336 | |||
337 | /* #define GetBe16(p) _byteswap_ushort(*(const UInt16 *)(const Byte *)(p)) */ | ||
338 | #define GetBe32(p) _byteswap_ulong (*(const UInt32 *)(const void *)(p)) | ||
339 | #define GetBe64(p) _byteswap_uint64(*(const UInt64 *)(const void *)(p)) | ||
340 | |||
341 | #define SetBe32(p, v) (*(UInt32 *)(void *)(p)) = _byteswap_ulong(v) | ||
342 | |||
343 | #elif defined(MY_CPU_LE_UNALIGN) && ( \ | ||
344 | (defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3))) \ | ||
345 | || (defined(__clang__) && MY__has_builtin(__builtin_bswap16)) ) | ||
346 | |||
347 | /* #define GetBe16(p) __builtin_bswap16(*(const UInt16 *)(const void *)(p)) */ | ||
348 | #define GetBe32(p) __builtin_bswap32(*(const UInt32 *)(const void *)(p)) | ||
349 | #define GetBe64(p) __builtin_bswap64(*(const UInt64 *)(const void *)(p)) | ||
350 | |||
351 | #define SetBe32(p, v) (*(UInt32 *)(void *)(p)) = __builtin_bswap32(v) | ||
352 | |||
353 | #else | 400 | #else |
354 | 401 | ||
355 | #define GetBe32(p) ( \ | 402 | #define GetBe32(p) ( \ |
@@ -358,8 +405,6 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
358 | ((UInt32)((const Byte *)(p))[2] << 8) | \ | 405 | ((UInt32)((const Byte *)(p))[2] << 8) | \ |
359 | ((const Byte *)(p))[3] ) | 406 | ((const Byte *)(p))[3] ) |
360 | 407 | ||
361 | #define GetBe64(p) (((UInt64)GetBe32(p) << 32) | GetBe32(((const Byte *)(p)) + 4)) | ||
362 | |||
363 | #define SetBe32(p, v) { Byte *_ppp_ = (Byte *)(p); UInt32 _vvv_ = (v); \ | 408 | #define SetBe32(p, v) { Byte *_ppp_ = (Byte *)(p); UInt32 _vvv_ = (v); \ |
364 | _ppp_[0] = (Byte)(_vvv_ >> 24); \ | 409 | _ppp_[0] = (Byte)(_vvv_ >> 24); \ |
365 | _ppp_[1] = (Byte)(_vvv_ >> 16); \ | 410 | _ppp_[1] = (Byte)(_vvv_ >> 16); \ |
@@ -368,50 +413,83 @@ MY_CPU_64BIT means that processor can work with 64-bit registers. | |||
368 | 413 | ||
369 | #endif | 414 | #endif |
370 | 415 | ||
416 | #ifndef GetBe64 | ||
417 | #define GetBe64(p) (((UInt64)GetBe32(p) << 32) | GetBe32(((const Byte *)(p)) + 4)) | ||
418 | #endif | ||
371 | 419 | ||
372 | #ifndef GetBe16 | 420 | #ifndef GetBe16 |
373 | |||
374 | #define GetBe16(p) ( (UInt16) ( \ | 421 | #define GetBe16(p) ( (UInt16) ( \ |
375 | ((UInt16)((const Byte *)(p))[0] << 8) | \ | 422 | ((UInt16)((const Byte *)(p))[0] << 8) | \ |
376 | ((const Byte *)(p))[1] )) | 423 | ((const Byte *)(p))[1] )) |
424 | #endif | ||
425 | |||
377 | 426 | ||
427 | #if defined(MY_CPU_BE) | ||
428 | #define Z7_CONV_BE_TO_NATIVE_CONST32(v) (v) | ||
429 | #define Z7_CONV_LE_TO_NATIVE_CONST32(v) Z7_BSWAP32_CONST(v) | ||
430 | #define Z7_CONV_NATIVE_TO_BE_32(v) (v) | ||
431 | #elif defined(MY_CPU_LE) | ||
432 | #define Z7_CONV_BE_TO_NATIVE_CONST32(v) Z7_BSWAP32_CONST(v) | ||
433 | #define Z7_CONV_LE_TO_NATIVE_CONST32(v) (v) | ||
434 | #define Z7_CONV_NATIVE_TO_BE_32(v) Z7_BSWAP32(v) | ||
435 | #else | ||
436 | #error Stop_Compiling_Unknown_Endian_CONV | ||
378 | #endif | 437 | #endif |
379 | 438 | ||
380 | 439 | ||
440 | #if defined(MY_CPU_BE) | ||
381 | 441 | ||
382 | #ifdef MY_CPU_X86_OR_AMD64 | 442 | #define GetBe32a(p) (*(const UInt32 *)(const void *)(p)) |
443 | #define GetBe16a(p) (*(const UInt16 *)(const void *)(p)) | ||
444 | #define SetBe32a(p, v) { *(UInt32 *)(void *)(p) = (v); } | ||
445 | #define SetBe16a(p, v) { *(UInt16 *)(void *)(p) = (v); } | ||
446 | |||
447 | #define GetUi32a(p) GetUi32(p) | ||
448 | #define GetUi16a(p) GetUi16(p) | ||
449 | #define SetUi32a(p, v) SetUi32(p, v) | ||
450 | #define SetUi16a(p, v) SetUi16(p, v) | ||
451 | |||
452 | #elif defined(MY_CPU_LE) | ||
383 | 453 | ||
384 | typedef struct | 454 | #define GetUi32a(p) (*(const UInt32 *)(const void *)(p)) |
385 | { | 455 | #define GetUi16a(p) (*(const UInt16 *)(const void *)(p)) |
386 | UInt32 maxFunc; | 456 | #define SetUi32a(p, v) { *(UInt32 *)(void *)(p) = (v); } |
387 | UInt32 vendor[3]; | 457 | #define SetUi16a(p, v) { *(UInt16 *)(void *)(p) = (v); } |
388 | UInt32 ver; | ||
389 | UInt32 b; | ||
390 | UInt32 c; | ||
391 | UInt32 d; | ||
392 | } Cx86cpuid; | ||
393 | 458 | ||
394 | enum | 459 | #define GetBe32a(p) GetBe32(p) |
395 | { | 460 | #define GetBe16a(p) GetBe16(p) |
396 | CPU_FIRM_INTEL, | 461 | #define SetBe32a(p, v) SetBe32(p, v) |
397 | CPU_FIRM_AMD, | 462 | #define SetBe16a(p, v) SetBe16(p, v) |
398 | CPU_FIRM_VIA | 463 | |
399 | }; | 464 | #else |
465 | #error Stop_Compiling_Unknown_Endian_CPU_a | ||
466 | #endif | ||
400 | 467 | ||
401 | void MyCPUID(UInt32 function, UInt32 *a, UInt32 *b, UInt32 *c, UInt32 *d); | ||
402 | 468 | ||
403 | BoolInt x86cpuid_CheckAndRead(Cx86cpuid *p); | 469 | #if defined(MY_CPU_X86_OR_AMD64) \ |
404 | int x86cpuid_GetFirm(const Cx86cpuid *p); | 470 | || defined(MY_CPU_ARM_OR_ARM64) \ |
471 | || defined(MY_CPU_PPC_OR_PPC64) | ||
472 | #define Z7_CPU_FAST_ROTATE_SUPPORTED | ||
473 | #endif | ||
405 | 474 | ||
406 | #define x86cpuid_GetFamily(ver) (((ver >> 16) & 0xFF0) | ((ver >> 8) & 0xF)) | ||
407 | #define x86cpuid_GetModel(ver) (((ver >> 12) & 0xF0) | ((ver >> 4) & 0xF)) | ||
408 | #define x86cpuid_GetStepping(ver) (ver & 0xF) | ||
409 | 475 | ||
410 | BoolInt CPU_Is_InOrder(void); | 476 | #ifdef MY_CPU_X86_OR_AMD64 |
477 | |||
478 | void Z7_FASTCALL z7_x86_cpuid(UInt32 a[4], UInt32 function); | ||
479 | UInt32 Z7_FASTCALL z7_x86_cpuid_GetMaxFunc(void); | ||
480 | #if defined(MY_CPU_AMD64) | ||
481 | #define Z7_IF_X86_CPUID_SUPPORTED | ||
482 | #else | ||
483 | #define Z7_IF_X86_CPUID_SUPPORTED if (z7_x86_cpuid_GetMaxFunc()) | ||
484 | #endif | ||
411 | 485 | ||
412 | BoolInt CPU_IsSupported_AES(void); | 486 | BoolInt CPU_IsSupported_AES(void); |
487 | BoolInt CPU_IsSupported_AVX(void); | ||
413 | BoolInt CPU_IsSupported_AVX2(void); | 488 | BoolInt CPU_IsSupported_AVX2(void); |
414 | BoolInt CPU_IsSupported_VAES_AVX2(void); | 489 | BoolInt CPU_IsSupported_VAES_AVX2(void); |
490 | BoolInt CPU_IsSupported_CMOV(void); | ||
491 | BoolInt CPU_IsSupported_SSE(void); | ||
492 | BoolInt CPU_IsSupported_SSE2(void); | ||
415 | BoolInt CPU_IsSupported_SSSE3(void); | 493 | BoolInt CPU_IsSupported_SSSE3(void); |
416 | BoolInt CPU_IsSupported_SSE41(void); | 494 | BoolInt CPU_IsSupported_SSE41(void); |
417 | BoolInt CPU_IsSupported_SHA(void); | 495 | BoolInt CPU_IsSupported_SHA(void); |
@@ -436,8 +514,8 @@ BoolInt CPU_IsSupported_AES(void); | |||
436 | #endif | 514 | #endif |
437 | 515 | ||
438 | #if defined(__APPLE__) | 516 | #if defined(__APPLE__) |
439 | int My_sysctlbyname_Get(const char *name, void *buf, size_t *bufSize); | 517 | int z7_sysctlbyname_Get(const char *name, void *buf, size_t *bufSize); |
440 | int My_sysctlbyname_Get_UInt32(const char *name, UInt32 *val); | 518 | int z7_sysctlbyname_Get_UInt32(const char *name, UInt32 *val); |
441 | #endif | 519 | #endif |
442 | 520 | ||
443 | EXTERN_C_END | 521 | EXTERN_C_END |