@@ -691,12 +691,14 @@ file(GLOB KERNEL_SRC
691
691
${PROJECT_SOURCE_DIR} /kernel/avx512/kernel_dgeqrf_8_lib8.c
692
692
${PROJECT_SOURCE_DIR} /kernel/avx512/kernel_dgelqf_lib8.S
693
693
694
- ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
695
-
696
694
${PROJECT_SOURCE_DIR} /kernel/avx2/kernel_dgemm_4x4_lib4.S
697
695
${PROJECT_SOURCE_DIR} /kernel/avx/kernel_dpack_lib4.S
698
696
)
699
697
698
+ file (GLOB KERNEL_ALIGN_SRC
699
+ ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
700
+ )
701
+
700
702
endif (${TARGET} MATCHES X64_INTEL_SKYLAKE_X )
701
703
702
704
if (${TARGET} MATCHES X64_INTEL_HASWELL )
@@ -743,11 +745,13 @@ file(GLOB KERNEL_SRC
743
745
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
744
746
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
745
747
746
- ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
747
-
748
748
${PROJECT_SOURCE_DIR} /kernel/avx/kernel_d_aux_lib.S
749
749
)
750
750
751
+ file (GLOB KERNEL_ALIGN_SRC
752
+ ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
753
+ )
754
+
751
755
endif (${TARGET} MATCHES X64_INTEL_HASWELL )
752
756
if (${TARGET} MATCHES X64_INTEL_SANDY_BRIDGE )
753
757
@@ -791,11 +795,13 @@ file(GLOB KERNEL_SRC
791
795
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
792
796
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
793
797
794
- ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
795
-
796
798
${PROJECT_SOURCE_DIR} /kernel/avx/kernel_d_aux_lib.S
797
799
)
798
800
801
+ file (GLOB KERNEL_ALIGN_SRC
802
+ ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
803
+ )
804
+
799
805
endif (${TARGET} MATCHES X64_INTEL_SANDY_BRIDGE )
800
806
if (${TARGET} MATCHES X64_INTEL_CORE )
801
807
@@ -829,11 +835,13 @@ file(GLOB KERNEL_SRC
829
835
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
830
836
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
831
837
832
- ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
833
-
834
838
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
835
839
)
836
840
841
+ file (GLOB KERNEL_ALIGN_SRC
842
+ ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
843
+ )
844
+
837
845
endif (${TARGET} MATCHES X64_INTEL_CORE )
838
846
if (${TARGET} MATCHES X64_AMD_BULLDOZER )
839
847
@@ -865,11 +873,13 @@ file(GLOB KERNEL_SRC
865
873
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
866
874
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
867
875
868
- ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
869
-
870
876
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
871
877
)
872
878
879
+ file (GLOB KERNEL_ALIGN_SRC
880
+ ${PROJECT_SOURCE_DIR} /kernel/sse3/kernel_align_x64.S
881
+ )
882
+
873
883
endif (${TARGET} MATCHES X64_AMD_BULLDOZER )
874
884
if (${TARGET} MATCHES ARMV8A_ARM_CORTEX_A57 OR ${TARGET2} MATCHES ARMV8A_ARM_CORTEX_A57 )
875
885
@@ -914,11 +924,13 @@ file(GLOB KERNEL_SRC
914
924
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
915
925
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
916
926
917
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
918
-
919
927
${PROJECT_SOURCE_DIR} /kernel/armv8a/kernel_d_aux_lib.S
920
928
)
921
929
930
+ file (GLOB KERNEL_ALIGN_SRC
931
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
932
+ )
933
+
922
934
endif (${TARGET} MATCHES ARMV8A_ARM_CORTEX_A57 OR ${TARGET2} MATCHES ARMV8A_ARM_CORTEX_A57 )
923
935
if (${TARGET} MATCHES ARMV8A_ARM_CORTEX_A53 OR ${TARGET2} MATCHES ARMV8A_ARM_CORTEX_A53 )
924
936
@@ -965,11 +977,13 @@ file(GLOB KERNEL_SRC
965
977
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
966
978
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
967
979
968
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
969
-
970
980
${PROJECT_SOURCE_DIR} /kernel/armv8a/kernel_d_aux_lib.S
971
981
)
972
982
983
+ file (GLOB KERNEL_ALIGN_SRC
984
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
985
+ )
986
+
973
987
endif (${TARGET} MATCHES ARMV8A_ARM_CORTEX_A53 OR ${TARGET2} MATCHES ARMV8A_ARM_CORTEX_A53 )
974
988
if (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A15 )
975
989
@@ -1004,11 +1018,13 @@ file(GLOB KERNEL_SRC
1004
1018
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
1005
1019
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
1006
1020
1007
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1008
-
1009
1021
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
1010
1022
)
1011
1023
1024
+ file (GLOB KERNEL_ALIGN_SRC
1025
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1026
+ )
1027
+
1012
1028
endif (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A15 )
1013
1029
if (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A7 )
1014
1030
@@ -1042,11 +1058,13 @@ file(GLOB KERNEL_SRC
1042
1058
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
1043
1059
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
1044
1060
1045
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1046
-
1047
1061
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
1048
1062
)
1049
1063
1064
+ file (GLOB KERNEL_ALIGN_SRC
1065
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1066
+ )
1067
+
1050
1068
endif (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A7 )
1051
1069
if (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A9 )
1052
1070
@@ -1080,11 +1098,13 @@ file(GLOB KERNEL_SRC
1080
1098
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
1081
1099
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
1082
1100
1083
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1084
-
1085
1101
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
1086
1102
)
1087
1103
1104
+ file (GLOB KERNEL_ALIGN_SRC
1105
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1106
+ )
1107
+
1088
1108
endif (${TARGET} MATCHES ARMV7A_ARM_CORTEX_A9 )
1089
1109
if (${TARGET} MATCHES GENERIC )
1090
1110
@@ -1115,11 +1135,13 @@ file(GLOB KERNEL_SRC
1115
1135
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_sdot_lib.c
1116
1136
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_saxpy_lib.c
1117
1137
1118
- ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1119
-
1120
1138
${PROJECT_SOURCE_DIR} /kernel/generic/kernel_d_aux_lib.c
1121
1139
)
1122
1140
1141
+ file (GLOB KERNEL_ALIGN_SRC
1142
+ ${PROJECT_SOURCE_DIR} /kernel/generic/kernel_align_generic.c
1143
+ )
1144
+
1123
1145
endif (${TARGET} MATCHES GENERIC )
1124
1146
1125
1147
@@ -1129,6 +1151,7 @@ set(BLASFEO_SRC ${AUX_COMMON_SRC})
1129
1151
if (${LA} MATCHES HIGH_PERFORMANCE )
1130
1152
1131
1153
list (APPEND BLASFEO_SRC ${KERNEL_SRC} )
1154
+ list (APPEND BLASFEO_SRC ${KERNEL_ALIGN_SRC} )
1132
1155
1133
1156
if (${MF} MATCHES PANELMAJ )
1134
1157
@@ -1168,6 +1191,7 @@ if(${LA} MATCHES HIGH_PERFORMANCE)
1168
1191
endif ()
1169
1192
if (${LA} MATCHES REFERENCE )
1170
1193
1194
+ list (APPEND BLASFEO_SRC ${KERNEL_ALIGN_SRC} )
1171
1195
list (APPEND BLASFEO_SRC ${AUX_REF_SRC} )
1172
1196
list (APPEND BLASFEO_SRC ${BLASFEO_REF_SRC} )
1173
1197
0 commit comments