Improvements to detection of AMD architectures. (#13407)
New entry for K10 microarchitecture. Reorder Zen* microarchitectures to avoid triggering as k10. Remove some desktop-specific flags that were preventing Opteron Bulldozer/Piledriver/Steamroller/Excavator CPUs from being recognized as such. Remove one or two flags which weren't produced in /proc/cpuinfo on older OS (RHEL6 and friends).
This commit is contained in:
parent
a6ea0bbbae
commit
77af4684aa
6 changed files with 142 additions and 4 deletions
|
@ -694,6 +694,38 @@
|
|||
}
|
||||
}
|
||||
},
|
||||
"k10": {
|
||||
"from": "x86_64",
|
||||
"vendor": "AuthenticAMD",
|
||||
"features": [
|
||||
"mmx",
|
||||
"sse",
|
||||
"sse2",
|
||||
"sse4a",
|
||||
"abm",
|
||||
"cx16",
|
||||
"3dnow",
|
||||
"3dnowext"
|
||||
],
|
||||
"compilers": {
|
||||
"gcc": {
|
||||
"name": "amdfam10",
|
||||
"versions": "4.3:",
|
||||
"flags": "-march={name} -mtune={name}"
|
||||
},
|
||||
"clang": {
|
||||
"versions": "3.9:",
|
||||
"name": "amdfam10",
|
||||
"family": "x86-64",
|
||||
"flags": "-march={family} -mcpu={name}"
|
||||
},
|
||||
"intel": {
|
||||
"versions": "16.0:",
|
||||
"warnings": "Intel's compilers may or may not optimize to the same degree for non-Intel microprocessors for optimizations that are not unique to Intel microprocessors",
|
||||
"flags": "-msse2"
|
||||
}
|
||||
}
|
||||
},
|
||||
"bulldozer": {
|
||||
"from": "x86_64",
|
||||
"vendor": "AuthenticAMD",
|
||||
|
@ -705,7 +737,7 @@
|
|||
"abm",
|
||||
"avx",
|
||||
"xop",
|
||||
"lwp",
|
||||
"fma4",
|
||||
"aes",
|
||||
"pclmulqdq",
|
||||
"cx16",
|
||||
|
@ -743,7 +775,7 @@
|
|||
"abm",
|
||||
"avx",
|
||||
"xop",
|
||||
"lwp",
|
||||
"fma4",
|
||||
"aes",
|
||||
"pclmulqdq",
|
||||
"cx16",
|
||||
|
@ -785,7 +817,7 @@
|
|||
"abm",
|
||||
"avx",
|
||||
"xop",
|
||||
"lwp",
|
||||
"fma4",
|
||||
"aes",
|
||||
"pclmulqdq",
|
||||
"cx16",
|
||||
|
@ -828,7 +860,7 @@
|
|||
"abm",
|
||||
"avx",
|
||||
"xop",
|
||||
"lwp",
|
||||
"fma4",
|
||||
"aes",
|
||||
"pclmulqdq",
|
||||
"cx16",
|
||||
|
|
26
lib/spack/spack/test/data/targets/linux-scientific7-k10
Normal file
26
lib/spack/spack/test/data/targets/linux-scientific7-k10
Normal file
|
@ -0,0 +1,26 @@
|
|||
processor : 0
|
||||
vendor_id : AuthenticAMD
|
||||
cpu family : 16
|
||||
model : 9
|
||||
model name : AMD Opteron(tm) Processor 6136
|
||||
stepping : 1
|
||||
microcode : 0x10000d9
|
||||
cpu MHz : 800.000
|
||||
cache size : 512 KB
|
||||
physical id : 0
|
||||
siblings : 8
|
||||
core id : 0
|
||||
cpu cores : 8
|
||||
apicid : 16
|
||||
initial apicid : 0
|
||||
fpu : yes
|
||||
fpu_exception : yes
|
||||
cpuid level : 5
|
||||
wp : yes
|
||||
flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ht syscall nx mmxext fxsr_opt pdpe1gb rdtscp lm 3dnowext 3dnow constant_tsc art rep_good nopl nonstop_tsc extd_apicid amd_dcm pni monitor cx16 popcnt lahf_lm cmp_legacy svm extapic cr8_legacy abm sse4a misalignsse 3dnowprefetch osvw ibs skinit wdt nodeid_msr hw_pstate retpoline_amd ibp_disable vmmcall npt lbrv svm_lock nrip_save pausefilter
|
||||
bogomips : 4800.19
|
||||
TLB size : 1024 4K pages
|
||||
clflush size : 64
|
||||
cache_alignment : 64
|
||||
address sizes : 48 bits physical, 48 bits virtual
|
||||
power management: ts ttp tm stc 100mhzsteps hwpstate
|
|
@ -0,0 +1,26 @@
|
|||
processor : 0
|
||||
vendor_id : AuthenticAMD
|
||||
cpu family : 21
|
||||
model : 2
|
||||
model name : AMD Opteron(tm) Processor 6320
|
||||
stepping : 0
|
||||
microcode : 0x6000852
|
||||
cpu MHz : 1400.000
|
||||
cache size : 2048 KB
|
||||
physical id : 0
|
||||
siblings : 8
|
||||
core id : 0
|
||||
cpu cores : 4
|
||||
apicid : 32
|
||||
initial apicid : 0
|
||||
fpu : yes
|
||||
fpu_exception : yes
|
||||
cpuid level : 13
|
||||
wp : yes
|
||||
flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ht syscall nx mmxext fxsr_opt pdpe1gb rdtscp lm constant_tsc art rep_good nopl nonstop_tsc extd_apicid amd_dcm aperfmperf pni pclmulqdq monitor ssse3 fma cx16 sse4_1 sse4_2 popcnt aes xsave avx f16c lahf_lm cmp_legacy svm extapic cr8_legacy abm sse4a misalignsse 3dnowprefetch osvw ibs xop skinit wdt fma4 tce nodeid_msr tbm topoext perfctr_core perfctr_nb cpb hw_pstate retpoline_amd ssbd ibpb vmmcall bmi1 arat npt lbrv svm_lock nrip_save tsc_scale vmcb_clean flushbyasid decodeassists pausefilter pfthreshold
|
||||
bogomips : 5600.11
|
||||
TLB size : 1536 4K pages
|
||||
clflush size : 64
|
||||
cache_alignment : 64
|
||||
address sizes : 48 bits physical, 48 bits virtual
|
||||
power management: ts ttp tm 100mhzsteps hwpstate cpb eff_freq_ro
|
|
@ -0,0 +1,25 @@
|
|||
processor : 0
|
||||
vendor_id : AuthenticAMD
|
||||
cpu family : 21
|
||||
model : 1
|
||||
model name : AMD Opteron(TM) Processor 6212
|
||||
stepping : 2
|
||||
cpu MHz : 2600.188
|
||||
cache size : 2048 KB
|
||||
physical id : 0
|
||||
siblings : 8
|
||||
core id : 0
|
||||
cpu cores : 4
|
||||
apicid : 32
|
||||
initial apicid : 0
|
||||
fpu : yes
|
||||
fpu_exception : yes
|
||||
cpuid level : 13
|
||||
wp : yes
|
||||
flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ht syscall nx mmxext fxsr_opt pdpe1gb rdtscp lm constant_tsc rep_good nonstop_tsc extd_apicid amd_dcm aperfmperf pni pclmulqdq monitor ssse3 cx16 sse4_1 sse4_2 popcnt aes xsave avx lahf_lm cmp_legacy svm extapic cr8_legacy abm sse4a misalignsse 3dnowprefetch osvw ibs xop skinit wdt lwp fma4 nodeid_msr topoext perfctr_core perfctr_nb cpb ssbd retpoline ibpb npt lbrv svm_lock nrip_save tsc_scale vmcb_clean flushbyasid decodeassists pausefilter pfthreshold
|
||||
bogomips : 5200.37
|
||||
TLB size : 1536 4K pages
|
||||
clflush size : 64
|
||||
cache_alignment : 64
|
||||
address sizes : 48 bits physical, 48 bits virtual
|
||||
power management: ts ttp tm 100mhzsteps hwpstate cpb
|
|
@ -0,0 +1,25 @@
|
|||
processor : 31
|
||||
vendor_id : AuthenticAMD
|
||||
cpu family : 21
|
||||
model : 2
|
||||
model name : AMD Opteron(tm) Processor 6320
|
||||
stepping : 0
|
||||
cpu MHz : 2800.154
|
||||
cache size : 2048 KB
|
||||
physical id : 3
|
||||
siblings : 8
|
||||
core id : 3
|
||||
cpu cores : 4
|
||||
apicid : 135
|
||||
initial apicid : 103
|
||||
fpu : yes
|
||||
fpu_exception : yes
|
||||
cpuid level : 13
|
||||
wp : yes
|
||||
flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 clflush mmx fxsr sse sse2 ht syscall nx mmxext fxsr_opt pdpe1gb rdtscp lm constant_tsc rep_good nonstop_tsc extd_apicid amd_dcm aperfmperf pni pclmulqdq monitor ssse3 fma cx16 sse4_1 sse4_2 popcnt aes xsave avx f16c lahf_lm cmp_legacy svm extapic cr8_legacy abm sse4a misalignsse 3dnowprefetch osvw ibs xop skinit wdt lwp fma4 tce nodeid_msr tbm topoext perfctr_core perfctr_nb cpb ssbd retpoline ibpb npt lbrv svm_lock nrip_save tsc_scale vmcb_clean flushbyasid decodeassists pausefilter pfthreshold bmi1
|
||||
bogomips : 5599.22
|
||||
TLB size : 1536 4K pages
|
||||
clflush size : 64
|
||||
cache_alignment : 64
|
||||
address sizes : 48 bits physical, 48 bits virtual
|
||||
power management: ts ttp tm 100mhzsteps hwpstate cpb eff_freq_ro
|
|
@ -26,6 +26,10 @@
|
|||
'linux-rhel7-ivybridge',
|
||||
'linux-rhel7-haswell',
|
||||
'linux-rhel7-zen',
|
||||
'linux-scientific7-k10',
|
||||
'linux-scientificfermi6-bulldozer',
|
||||
'linux-scientificfermi6-piledriver',
|
||||
'linux-scientific7-piledriver',
|
||||
'linux-rhel6-piledriver',
|
||||
'linux-centos7-power8le',
|
||||
'darwin-mojave-ivybridge',
|
||||
|
|
Loading…
Reference in a new issue