aboutsummaryrefslogtreecommitdiff
path: root/C/CpuArch.h
diff options
context:
space:
mode:
Diffstat (limited to 'C/CpuArch.h')
-rw-r--r--C/CpuArch.h218
1 files changed, 148 insertions, 70 deletions
diff --git a/C/CpuArch.h b/C/CpuArch.h
index 4856fbb..8e5d8a5 100644
--- a/C/CpuArch.h
+++ b/C/CpuArch.h
@@ -1,8 +1,8 @@
1/* CpuArch.h -- CPU specific code 1/* CpuArch.h -- CPU specific code
22022-07-15 : Igor Pavlov : Public domain */ 22023-04-02 : Igor Pavlov : Public domain */
3 3
4#ifndef __CPU_ARCH_H 4#ifndef ZIP7_INC_CPU_ARCH_H
5#define __CPU_ARCH_H 5#define ZIP7_INC_CPU_ARCH_H
6 6
7#include "7zTypes.h" 7#include "7zTypes.h"
8 8
@@ -51,7 +51,13 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
51 || defined(__AARCH64EB__) \ 51 || defined(__AARCH64EB__) \
52 || defined(__aarch64__) 52 || defined(__aarch64__)
53 #define MY_CPU_ARM64 53 #define MY_CPU_ARM64
54 #define MY_CPU_NAME "arm64" 54 #ifdef __ILP32__
55 #define MY_CPU_NAME "arm64-32"
56 #define MY_CPU_SIZEOF_POINTER 4
57 #else
58 #define MY_CPU_NAME "arm64"
59 #define MY_CPU_SIZEOF_POINTER 8
60 #endif
55 #define MY_CPU_64BIT 61 #define MY_CPU_64BIT
56#endif 62#endif
57 63
@@ -68,8 +74,10 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
68 #define MY_CPU_ARM 74 #define MY_CPU_ARM
69 75
70 #if defined(__thumb__) || defined(__THUMBEL__) || defined(_M_ARMT) 76 #if defined(__thumb__) || defined(__THUMBEL__) || defined(_M_ARMT)
77 #define MY_CPU_ARMT
71 #define MY_CPU_NAME "armt" 78 #define MY_CPU_NAME "armt"
72 #else 79 #else
80 #define MY_CPU_ARM32
73 #define MY_CPU_NAME "arm" 81 #define MY_CPU_NAME "arm"
74 #endif 82 #endif
75 /* #define MY_CPU_32BIT */ 83 /* #define MY_CPU_32BIT */
@@ -103,6 +111,8 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
103 || defined(__PPC__) \ 111 || defined(__PPC__) \
104 || defined(_POWER) 112 || defined(_POWER)
105 113
114#define MY_CPU_PPC_OR_PPC64
115
106#if defined(__ppc64__) \ 116#if defined(__ppc64__) \
107 || defined(__powerpc64__) \ 117 || defined(__powerpc64__) \
108 || defined(_LP64) \ 118 || defined(_LP64) \
@@ -197,6 +207,9 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
197 #error Stop_Compiling_Bad_Endian 207 #error Stop_Compiling_Bad_Endian
198#endif 208#endif
199 209
210#if !defined(MY_CPU_LE) && !defined(MY_CPU_BE)
211 #error Stop_Compiling_CPU_ENDIAN_must_be_detected_at_compile_time
212#endif
200 213
201#if defined(MY_CPU_32BIT) && defined(MY_CPU_64BIT) 214#if defined(MY_CPU_32BIT) && defined(MY_CPU_64BIT)
202 #error Stop_Compiling_Bad_32_64_BIT 215 #error Stop_Compiling_Bad_32_64_BIT
@@ -253,6 +266,67 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
253 266
254 267
255 268
269#ifdef __has_builtin
270 #define Z7_has_builtin(x) __has_builtin(x)
271#else
272 #define Z7_has_builtin(x) 0
273#endif
274
275
276#define Z7_BSWAP32_CONST(v) \
277 ( (((UInt32)(v) << 24) ) \
278 | (((UInt32)(v) << 8) & (UInt32)0xff0000) \
279 | (((UInt32)(v) >> 8) & (UInt32)0xff00 ) \
280 | (((UInt32)(v) >> 24) ))
281
282
283#if defined(_MSC_VER) && (_MSC_VER >= 1300)
284
285#include <stdlib.h>
286
287/* Note: these macros will use bswap instruction (486), that is unsupported in 386 cpu */
288
289#pragma intrinsic(_byteswap_ushort)
290#pragma intrinsic(_byteswap_ulong)
291#pragma intrinsic(_byteswap_uint64)
292
293#define Z7_BSWAP16(v) _byteswap_ushort(v)
294#define Z7_BSWAP32(v) _byteswap_ulong (v)
295#define Z7_BSWAP64(v) _byteswap_uint64(v)
296#define Z7_CPU_FAST_BSWAP_SUPPORTED
297
298#elif (defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3))) \
299 || (defined(__clang__) && Z7_has_builtin(__builtin_bswap16))
300
301#define Z7_BSWAP16(v) __builtin_bswap16(v)
302#define Z7_BSWAP32(v) __builtin_bswap32(v)
303#define Z7_BSWAP64(v) __builtin_bswap64(v)
304#define Z7_CPU_FAST_BSWAP_SUPPORTED
305
306#else
307
308#define Z7_BSWAP16(v) ((UInt16) \
309 ( ((UInt32)(v) << 8) \
310 | ((UInt32)(v) >> 8) \
311 ))
312
313#define Z7_BSWAP32(v) Z7_BSWAP32_CONST(v)
314
315#define Z7_BSWAP64(v) \
316 ( ( ( (UInt64)(v) ) << 8 * 7 ) \
317 | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 1) ) << 8 * 5 ) \
318 | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 2) ) << 8 * 3 ) \
319 | ( ( (UInt64)(v) & ((UInt32)0xff << 8 * 3) ) << 8 * 1 ) \
320 | ( ( (UInt64)(v) >> 8 * 1 ) & ((UInt32)0xff << 8 * 3) ) \
321 | ( ( (UInt64)(v) >> 8 * 3 ) & ((UInt32)0xff << 8 * 2) ) \
322 | ( ( (UInt64)(v) >> 8 * 5 ) & ((UInt32)0xff << 8 * 1) ) \
323 | ( ( (UInt64)(v) >> 8 * 7 ) ) \
324 )
325
326#endif
327
328
329
256#ifdef MY_CPU_LE 330#ifdef MY_CPU_LE
257 #if defined(MY_CPU_X86_OR_AMD64) \ 331 #if defined(MY_CPU_X86_OR_AMD64) \
258 || defined(MY_CPU_ARM64) 332 || defined(MY_CPU_ARM64)
@@ -272,13 +346,11 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
272#define GetUi32(p) (*(const UInt32 *)(const void *)(p)) 346#define GetUi32(p) (*(const UInt32 *)(const void *)(p))
273#ifdef MY_CPU_LE_UNALIGN_64 347#ifdef MY_CPU_LE_UNALIGN_64
274#define GetUi64(p) (*(const UInt64 *)(const void *)(p)) 348#define GetUi64(p) (*(const UInt64 *)(const void *)(p))
349#define SetUi64(p, v) { *(UInt64 *)(void *)(p) = (v); }
275#endif 350#endif
276 351
277#define SetUi16(p, v) { *(UInt16 *)(void *)(p) = (v); } 352#define SetUi16(p, v) { *(UInt16 *)(void *)(p) = (v); }
278#define SetUi32(p, v) { *(UInt32 *)(void *)(p) = (v); } 353#define SetUi32(p, v) { *(UInt32 *)(void *)(p) = (v); }
279#ifdef MY_CPU_LE_UNALIGN_64
280#define SetUi64(p, v) { *(UInt64 *)(void *)(p) = (v); }
281#endif
282 354
283#else 355#else
284 356
@@ -305,51 +377,26 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
305#endif 377#endif
306 378
307 379
308#ifndef MY_CPU_LE_UNALIGN_64 380#ifndef GetUi64
309
310#define GetUi64(p) (GetUi32(p) | ((UInt64)GetUi32(((const Byte *)(p)) + 4) << 32)) 381#define GetUi64(p) (GetUi32(p) | ((UInt64)GetUi32(((const Byte *)(p)) + 4) << 32))
382#endif
311 383
384#ifndef SetUi64
312#define SetUi64(p, v) { Byte *_ppp2_ = (Byte *)(p); UInt64 _vvv2_ = (v); \ 385#define SetUi64(p, v) { Byte *_ppp2_ = (Byte *)(p); UInt64 _vvv2_ = (v); \
313 SetUi32(_ppp2_ , (UInt32)_vvv2_); \ 386 SetUi32(_ppp2_ , (UInt32)_vvv2_) \
314 SetUi32(_ppp2_ + 4, (UInt32)(_vvv2_ >> 32)); } 387 SetUi32(_ppp2_ + 4, (UInt32)(_vvv2_ >> 32)) }
315
316#endif 388#endif
317 389
318 390
391#if defined(MY_CPU_LE_UNALIGN) && defined(Z7_CPU_FAST_BSWAP_SUPPORTED)
319 392
393#define GetBe32(p) Z7_BSWAP32 (*(const UInt32 *)(const void *)(p))
394#define SetBe32(p, v) { (*(UInt32 *)(void *)(p)) = Z7_BSWAP32(v); }
320 395
321#ifdef __has_builtin 396#if defined(MY_CPU_LE_UNALIGN_64)
322 #define MY__has_builtin(x) __has_builtin(x) 397#define GetBe64(p) Z7_BSWAP64 (*(const UInt64 *)(const void *)(p))
323#else
324 #define MY__has_builtin(x) 0
325#endif 398#endif
326 399
327#if defined(MY_CPU_LE_UNALIGN) && /* defined(_WIN64) && */ defined(_MSC_VER) && (_MSC_VER >= 1300)
328
329/* Note: we use bswap instruction, that is unsupported in 386 cpu */
330
331#include <stdlib.h>
332
333#pragma intrinsic(_byteswap_ushort)
334#pragma intrinsic(_byteswap_ulong)
335#pragma intrinsic(_byteswap_uint64)
336
337/* #define GetBe16(p) _byteswap_ushort(*(const UInt16 *)(const Byte *)(p)) */
338#define GetBe32(p) _byteswap_ulong (*(const UInt32 *)(const void *)(p))
339#define GetBe64(p) _byteswap_uint64(*(const UInt64 *)(const void *)(p))
340
341#define SetBe32(p, v) (*(UInt32 *)(void *)(p)) = _byteswap_ulong(v)
342
343#elif defined(MY_CPU_LE_UNALIGN) && ( \
344 (defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 3))) \
345 || (defined(__clang__) && MY__has_builtin(__builtin_bswap16)) )
346
347/* #define GetBe16(p) __builtin_bswap16(*(const UInt16 *)(const void *)(p)) */
348#define GetBe32(p) __builtin_bswap32(*(const UInt32 *)(const void *)(p))
349#define GetBe64(p) __builtin_bswap64(*(const UInt64 *)(const void *)(p))
350
351#define SetBe32(p, v) (*(UInt32 *)(void *)(p)) = __builtin_bswap32(v)
352
353#else 400#else
354 401
355#define GetBe32(p) ( \ 402#define GetBe32(p) ( \
@@ -358,8 +405,6 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
358 ((UInt32)((const Byte *)(p))[2] << 8) | \ 405 ((UInt32)((const Byte *)(p))[2] << 8) | \
359 ((const Byte *)(p))[3] ) 406 ((const Byte *)(p))[3] )
360 407
361#define GetBe64(p) (((UInt64)GetBe32(p) << 32) | GetBe32(((const Byte *)(p)) + 4))
362
363#define SetBe32(p, v) { Byte *_ppp_ = (Byte *)(p); UInt32 _vvv_ = (v); \ 408#define SetBe32(p, v) { Byte *_ppp_ = (Byte *)(p); UInt32 _vvv_ = (v); \
364 _ppp_[0] = (Byte)(_vvv_ >> 24); \ 409 _ppp_[0] = (Byte)(_vvv_ >> 24); \
365 _ppp_[1] = (Byte)(_vvv_ >> 16); \ 410 _ppp_[1] = (Byte)(_vvv_ >> 16); \
@@ -368,50 +413,83 @@ MY_CPU_64BIT means that processor can work with 64-bit registers.
368 413
369#endif 414#endif
370 415
416#ifndef GetBe64
417#define GetBe64(p) (((UInt64)GetBe32(p) << 32) | GetBe32(((const Byte *)(p)) + 4))
418#endif
371 419
372#ifndef GetBe16 420#ifndef GetBe16
373
374#define GetBe16(p) ( (UInt16) ( \ 421#define GetBe16(p) ( (UInt16) ( \
375 ((UInt16)((const Byte *)(p))[0] << 8) | \ 422 ((UInt16)((const Byte *)(p))[0] << 8) | \
376 ((const Byte *)(p))[1] )) 423 ((const Byte *)(p))[1] ))
424#endif
425
377 426
427#if defined(MY_CPU_BE)
428#define Z7_CONV_BE_TO_NATIVE_CONST32(v) (v)
429#define Z7_CONV_LE_TO_NATIVE_CONST32(v) Z7_BSWAP32_CONST(v)
430#define Z7_CONV_NATIVE_TO_BE_32(v) (v)
431#elif defined(MY_CPU_LE)
432#define Z7_CONV_BE_TO_NATIVE_CONST32(v) Z7_BSWAP32_CONST(v)
433#define Z7_CONV_LE_TO_NATIVE_CONST32(v) (v)
434#define Z7_CONV_NATIVE_TO_BE_32(v) Z7_BSWAP32(v)
435#else
436#error Stop_Compiling_Unknown_Endian_CONV
378#endif 437#endif
379 438
380 439
440#if defined(MY_CPU_BE)
381 441
382#ifdef MY_CPU_X86_OR_AMD64 442#define GetBe32a(p) (*(const UInt32 *)(const void *)(p))
443#define GetBe16a(p) (*(const UInt16 *)(const void *)(p))
444#define SetBe32a(p, v) { *(UInt32 *)(void *)(p) = (v); }
445#define SetBe16a(p, v) { *(UInt16 *)(void *)(p) = (v); }
446
447#define GetUi32a(p) GetUi32(p)
448#define GetUi16a(p) GetUi16(p)
449#define SetUi32a(p, v) SetUi32(p, v)
450#define SetUi16a(p, v) SetUi16(p, v)
451
452#elif defined(MY_CPU_LE)
383 453
384typedef struct 454#define GetUi32a(p) (*(const UInt32 *)(const void *)(p))
385{ 455#define GetUi16a(p) (*(const UInt16 *)(const void *)(p))
386 UInt32 maxFunc; 456#define SetUi32a(p, v) { *(UInt32 *)(void *)(p) = (v); }
387 UInt32 vendor[3]; 457#define SetUi16a(p, v) { *(UInt16 *)(void *)(p) = (v); }
388 UInt32 ver;
389 UInt32 b;
390 UInt32 c;
391 UInt32 d;
392} Cx86cpuid;
393 458
394enum 459#define GetBe32a(p) GetBe32(p)
395{ 460#define GetBe16a(p) GetBe16(p)
396 CPU_FIRM_INTEL, 461#define SetBe32a(p, v) SetBe32(p, v)
397 CPU_FIRM_AMD, 462#define SetBe16a(p, v) SetBe16(p, v)
398 CPU_FIRM_VIA 463
399}; 464#else
465#error Stop_Compiling_Unknown_Endian_CPU_a
466#endif
400 467
401void MyCPUID(UInt32 function, UInt32 *a, UInt32 *b, UInt32 *c, UInt32 *d);
402 468
403BoolInt x86cpuid_CheckAndRead(Cx86cpuid *p); 469#if defined(MY_CPU_X86_OR_AMD64) \
404int x86cpuid_GetFirm(const Cx86cpuid *p); 470 || defined(MY_CPU_ARM_OR_ARM64) \
471 || defined(MY_CPU_PPC_OR_PPC64)
472 #define Z7_CPU_FAST_ROTATE_SUPPORTED
473#endif
405 474
406#define x86cpuid_GetFamily(ver) (((ver >> 16) & 0xFF0) | ((ver >> 8) & 0xF))
407#define x86cpuid_GetModel(ver) (((ver >> 12) & 0xF0) | ((ver >> 4) & 0xF))
408#define x86cpuid_GetStepping(ver) (ver & 0xF)
409 475
410BoolInt CPU_Is_InOrder(void); 476#ifdef MY_CPU_X86_OR_AMD64
477
478void Z7_FASTCALL z7_x86_cpuid(UInt32 a[4], UInt32 function);
479UInt32 Z7_FASTCALL z7_x86_cpuid_GetMaxFunc(void);
480#if defined(MY_CPU_AMD64)
481#define Z7_IF_X86_CPUID_SUPPORTED
482#else
483#define Z7_IF_X86_CPUID_SUPPORTED if (z7_x86_cpuid_GetMaxFunc())
484#endif
411 485
412BoolInt CPU_IsSupported_AES(void); 486BoolInt CPU_IsSupported_AES(void);
487BoolInt CPU_IsSupported_AVX(void);
413BoolInt CPU_IsSupported_AVX2(void); 488BoolInt CPU_IsSupported_AVX2(void);
414BoolInt CPU_IsSupported_VAES_AVX2(void); 489BoolInt CPU_IsSupported_VAES_AVX2(void);
490BoolInt CPU_IsSupported_CMOV(void);
491BoolInt CPU_IsSupported_SSE(void);
492BoolInt CPU_IsSupported_SSE2(void);
415BoolInt CPU_IsSupported_SSSE3(void); 493BoolInt CPU_IsSupported_SSSE3(void);
416BoolInt CPU_IsSupported_SSE41(void); 494BoolInt CPU_IsSupported_SSE41(void);
417BoolInt CPU_IsSupported_SHA(void); 495BoolInt CPU_IsSupported_SHA(void);
@@ -436,8 +514,8 @@ BoolInt CPU_IsSupported_AES(void);
436#endif 514#endif
437 515
438#if defined(__APPLE__) 516#if defined(__APPLE__)
439int My_sysctlbyname_Get(const char *name, void *buf, size_t *bufSize); 517int z7_sysctlbyname_Get(const char *name, void *buf, size_t *bufSize);
440int My_sysctlbyname_Get_UInt32(const char *name, UInt32 *val); 518int z7_sysctlbyname_Get_UInt32(const char *name, UInt32 *val);
441#endif 519#endif
442 520
443EXTERN_C_END 521EXTERN_C_END