ObjFW  Diff

Differences From Artifact [4a5cc32620]:

To Artifact [dde9f4593e]:


314
315
316
317
318
319
320


















321
322
323
324
325
326
327
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345







+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+







	);
# else
	memset(&regs, 0, sizeof(regs));
# endif

	return regs;
}

/*
 * Reads the extended control register selected by `ecx` using XGETBV.
 *
 * On success, the low half of the register is returned in `eax` and the high
 * half in `edx`; the remaining members of the result stay zero. If CPUID leaf
 * 1 is unavailable or does not report OSXSAVE (ECX bit 27), XGETBV is not
 * executed and an all-zero result is returned.
 */
static OF_INLINE struct X86Regs
x86XCR(uint32_t ecx)
{
	struct X86Regs regs = { 0 };

	/*
	 * XGETBV may only be executed once the OS has enabled XSAVE, which
	 * CPUID leaf 1 reports in ECX bit 27. Make sure leaf 1 exists before
	 * trusting that bit, the same way the callers guard their own CPUID
	 * queries.
	 */
	if (x86CPUID(0, 0).eax < 1 || !(x86CPUID(1, 0).ecx & (1u << 27)))
		return regs;

	__asm__ (
	    "xgetbv"
	    : "=a" (regs.eax),
	      "=d" (regs.edx)
	    : "c" (ecx)
	);

	return regs;
}
#endif

@implementation OFSystemInfo
+ (void)initialize
{
	long tmp;

755
756
757
758
759
760
761
762


763
764
765
766
767


768
769
770
771
772


773
774
775
776
777


778
779
780
781
782


783
784
785
786
787


788
789
790
791
792


793
794
795
796
797


798
799
800
801
802
803
804
773
774
775
776
777
778
779

780
781
782
783
784
785

786
787
788
789
790
791

792
793
794
795
796
797

798
799
800
801
802
803

804
805
806
807
808
809

810
811
812
813
814
815

816
817
818
819
820
821

822
823
824
825
826
827
828
829
830







-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+







{
	return (x86CPUID(0x80000000, 0).eax >= 0x80000001 &&
	    x86CPUID(0x80000001, 0).edx & (1u << 30));
}

/*
 * Whether SSE can be used: CPUID leaf 1 must report SSE (EDX bit 25) and XCR0
 * must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSE
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).edx & (1u << 25)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether SSE2 can be used: CPUID leaf 1 must report SSE2 (EDX bit 26) and
 * XCR0 must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSE2
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).edx & (1u << 26)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether SSE3 can be used: CPUID leaf 1 must report SSE3 (ECX bit 0) and XCR0
 * must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSE3
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).ecx & (1u << 0)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether SSSE3 can be used: CPUID leaf 1 must report SSSE3 (ECX bit 9) and
 * XCR0 must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSSE3
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).ecx & (1u << 9)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether SSE4.1 can be used: CPUID leaf 1 must report SSE4.1 (ECX bit 19) and
 * XCR0 must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSE41
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).ecx & (1u << 19)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether SSE4.2 can be used: CPUID leaf 1 must report SSE4.2 (ECX bit 20) and
 * XCR0 must have the SSE state bit (bit 1) set.
 *
 * NOTE(review): x86XCR() returns all zeroes when CPUID does not report
 * OSXSAVE, so this yields false on systems without XSAVE - confirm that this
 * is intended.
 */
+ (bool)supportsSSE42
{
	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).ecx & (1u << 20)) &&
	    x86XCR(0).eax & (1u << 1));
}

/*
 * Whether AVX can be used: CPUID leaf 1 must report AVX (ECX bit 28) and the
 * OS must have enabled the register state AVX needs in XCR0.
 */
+ (bool)supportsAVX
{
	/* Both the SSE (bit 1) and the AVX (bit 2) state must be enabled. */
	const uint32_t requiredState = (1u << 1) | (1u << 2);

	return ((x86CPUID(0, 0).eax >= 1 && x86CPUID(1, 0).ecx & (1u << 28)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX2 can be used: CPUID leaf 7, sub-leaf 0 must report AVX2 (EBX bit
 * 5) and the OS must have enabled the register state AVX needs in XCR0.
 */
+ (bool)supportsAVX2
{
	/* Both the SSE (bit 1) and the AVX (bit 2) state must be enabled. */
	const uint32_t requiredState = (1u << 1) | (1u << 2);

	return ((x86CPUID(0, 0).eax >= 7 && (x86CPUID(7, 0).ebx & (1u << 5))) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether CPUID leaf 1 reports AES-NI (ECX bit 25). False if leaf 1 is not
 * available.
 */
+ (bool)supportsAESNI
{
	if (x86CPUID(0, 0).eax < 1)
		return false;

	return ((x86CPUID(1, 0).ecx & (1u << 25)) != 0);
}

815
816
817
818
819
820
821
822


823
824
825
826
827


828
829
830
831
832


833
834
835
836
837


838
839
840
841
842


843
844
845
846
847


848
849
850
851
852


853
854
855
856
857


858
859
860
861
862


863
864
865
866
867


868
869
870
871
872


873
874
875
876
877


878
879
880
881
882


883
884
885
886
887


888
889
890
891
892


893
894
895
896
897
898
899
841
842
843
844
845
846
847

848
849
850
851
852
853

854
855
856
857
858
859

860
861
862
863
864
865

866
867
868
869
870
871

872
873
874
875
876
877

878
879
880
881
882
883

884
885
886
887
888
889

890
891
892
893
894
895

896
897
898
899
900
901

902
903
904
905
906
907

908
909
910
911
912
913

914
915
916
917
918
919

920
921
922
923
924
925

926
927
928
929
930
931

932
933
934
935
936
937
938
939
940







-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+




-
+
+







/*
 * Whether CPUID leaf 1 reports F16C (ECX bit 29). False if leaf 1 is not
 * available.
 */
+ (bool)supportsF16C
{
	if (x86CPUID(0, 0).eax < 1)
		return false;

	return ((x86CPUID(1, 0).ecx & (1u << 29)) != 0);
}

/*
 * Whether AVX-512 Foundation can be used: CPUID leaf 7, sub-leaf 0 must report
 * it (EBX bit 16) and the OS must have enabled all AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512Foundation
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 16)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Conflict Detection can be used: CPUID leaf 7, sub-leaf 0
 * must report it (EBX bit 28) and the OS must have enabled all AVX-512 state
 * in XCR0.
 */
+ (bool)supportsAVX512ConflictDetectionInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 28)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Exponential and Reciprocal can be used: CPUID leaf 7,
 * sub-leaf 0 must report it (EBX bit 27) and the OS must have enabled all
 * AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512ExponentialAndReciprocalInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 27)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Prefetch can be used: CPUID leaf 7, sub-leaf 0 must report
 * it (EBX bit 26) and the OS must have enabled all AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512PrefetchInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 26)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Vector Length Extensions can be used: CPUID leaf 7, sub-leaf
 * 0 must report them (EBX bit 31) and the OS must have enabled all AVX-512
 * state in XCR0.
 */
+ (bool)supportsAVX512VectorLengthExtensions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 31)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Doubleword and Quadword can be used: CPUID leaf 7, sub-leaf
 * 0 must report it (EBX bit 17) and the OS must have enabled all AVX-512 state
 * in XCR0.
 */
+ (bool)supportsAVX512DoublewordAndQuadwordInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 17)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Byte and Word can be used: CPUID leaf 7, sub-leaf 0 must
 * report it (EBX bit 30) and the OS must have enabled all AVX-512 state in
 * XCR0.
 */
+ (bool)supportsAVX512ByteAndWordInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 30)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Integer Fused Multiply-Add can be used: CPUID leaf 7,
 * sub-leaf 0 must report it (EBX bit 21) and the OS must have enabled all
 * AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512IntegerFusedMultiplyAdd
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ebx & (1u << 21)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Vector Byte Manipulation can be used: CPUID leaf 7, sub-leaf
 * 0 must report it (ECX bit 1) and the OS must have enabled all AVX-512 state
 * in XCR0.
 */
+ (bool)supportsAVX512VectorByteManipulationInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ecx & (1u << 1)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Vector Population Count can be used: CPUID leaf 7, sub-leaf
 * 0 must report it (ECX bit 14) and the OS must have enabled all AVX-512 state
 * in XCR0.
 */
+ (bool)supportsAVX512VectorPopulationCountInstruction
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ecx & (1u << 14)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Vector Neural Network Instructions can be used: CPUID leaf
 * 7, sub-leaf 0 must report them (ECX bit 11) and the OS must have enabled all
 * AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512VectorNeuralNetworkInstructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ecx & (1u << 11)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Vector Byte Manipulation 2 can be used: CPUID leaf 7,
 * sub-leaf 0 must report it (ECX bit 6) and the OS must have enabled all
 * AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512VectorByteManipulationInstructions2
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ecx & (1u << 6)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Bit Algorithms can be used: CPUID leaf 7, sub-leaf 0 must
 * report them (ECX bit 12) and the OS must have enabled all AVX-512 state in
 * XCR0.
 */
+ (bool)supportsAVX512BitAlgorithms
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).ecx & (1u << 12)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 Float16 can be used: CPUID leaf 7, sub-leaf 0 must report it
 * (EDX bit 23) and the OS must have enabled all AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512Float16Instructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 0).edx & (1u << 23)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}

/*
 * Whether AVX-512 BFloat16 can be used: CPUID leaf 7, sub-leaf 1 must report
 * it (EAX bit 5) and the OS must have enabled all AVX-512 state in XCR0.
 */
+ (bool)supportsAVX512BFloat16Instructions
{
	/*
	 * SSE (bit 1), AVX (bit 2), opmask (bit 5), ZMM_Hi256 (bit 6) and
	 * Hi16_ZMM (bit 7) state must all be enabled, not just one of them.
	 */
	const uint32_t requiredState = (1u << 1) | (1u << 2) | (1u << 5) |
	    (1u << 6) | (1u << 7);

	return ((x86CPUID(0, 0).eax >= 7 && x86CPUID(7, 1).eax & (1u << 5)) &&
	    (x86XCR(0).eax & requiredState) == requiredState);
}
#endif

#if defined(OF_POWERPC) || defined(OF_POWERPC64)
+ (bool)supportsAltiVec
{
# if defined(OF_MACOS)