/usr/include/gromacs/gmx_cpuid.h is in gromacs-dev 4.6.5-1build1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 | /*
* This file is part of the GROMACS molecular simulation package.
*
* Copyright (c) 2012,2013, by the GROMACS development team, led by
* David van der Spoel, Berk Hess, Erik Lindahl, and including many
* others, as listed in the AUTHORS file in the top-level source
* directory and at http://www.gromacs.org.
*
* GROMACS is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public License
* as published by the Free Software Foundation; either version 2.1
* of the License, or (at your option) any later version.
*
* GROMACS is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with GROMACS; if not, see
* http://www.gnu.org/licenses, or write to the Free Software Foundation,
* Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*
* If you want to redistribute modifications to GROMACS, please
* consider that scientific software is very special. Version
* control is crucial - bugs must be traceable. We will be happy to
* consider code for inclusion in the official distribution, but
* derived work must not be called official GROMACS. Details are found
* in the README & COPYING files - if they are missing, get the
* official version at http://www.gromacs.org.
*
* To help us fund GROMACS development, we humbly ask that you cite
* the research papers on the package. Check out http://www.gromacs.org.
*/
#ifndef GMX_CPUID_H_
#define GMX_CPUID_H_
#include <stdio.h>
#include "visibility.h"
#ifdef __cplusplus
extern "C" {
#endif
#if 0
} /* fixes auto-indentation problems */
#endif
/* Currently identifiable CPU Vendors */
enum gmx_cpuid_vendor
{
GMX_CPUID_VENDOR_CANNOTDETECT, /* Should only be used if something fails */
GMX_CPUID_VENDOR_UNKNOWN,
GMX_CPUID_VENDOR_INTEL,
GMX_CPUID_VENDOR_AMD,
GMX_CPUID_VENDOR_FUJITSU,
GMX_CPUID_VENDOR_IBM,
GMX_CPUID_NVENDORS
};
/* CPU feature/property list, to be used as indices into the feature array of the
* gmxcpuid_t data structure.
*
* To facilitate looking things up, we keep this list alphabetical.
* The list is NOT exhaustive - we have basically added stuff that might be
* useful in an application like Gromacs.
*
* AMD and Intel tend to share most architectural elements, and even if the
* flags might have to be detected in different ways (different cpuid registers),
* once the flag is present the functions should be identical. Unfortunately the
* trend right now (2012) seems to be that they are diverging. This means that
* we need to use specific flags to the compiler to maximize performance, and
* then the binaries might not be portable between Intel and AMD as they were
* before when we only needed to check for SSE and/or SSE2 support in Gromacs.
*/
enum gmx_cpuid_feature
{
GMX_CPUID_FEATURE_CANNOTDETECT, /* Flag set if we could not detect on this CPU */
GMX_CPUID_FEATURE_X86_AES, /* x86 advanced encryption standard accel. */
GMX_CPUID_FEATURE_X86_APIC, /* APIC support */
GMX_CPUID_FEATURE_X86_AVX, /* Advanced vector extensions */
GMX_CPUID_FEATURE_X86_AVX2, /* AVX2 including gather support (not used yet) */
GMX_CPUID_FEATURE_X86_CLFSH, /* Supports CLFLUSH instruction */
GMX_CPUID_FEATURE_X86_CMOV, /* Conditional move insn support */
GMX_CPUID_FEATURE_X86_CX8, /* Supports CMPXCHG8B (8-byte compare-exchange) */
GMX_CPUID_FEATURE_X86_CX16, /* Supports CMPXCHG16B (16-byte compare-exchg) */
GMX_CPUID_FEATURE_X86_F16C, /* Supports 16-bit FP conversion instructions */
GMX_CPUID_FEATURE_X86_FMA, /* Fused-multiply add support (mainly for AVX) */
GMX_CPUID_FEATURE_X86_FMA4, /* 4-operand FMA, only on AMD for now */
GMX_CPUID_FEATURE_X86_HTT, /* Hyper-Threading supported */
GMX_CPUID_FEATURE_X86_LAHF_LM, /* LAHF/SAHF support in 64 bits */
GMX_CPUID_FEATURE_X86_MISALIGNSSE, /* Support for misaligned SSE data instructions */
GMX_CPUID_FEATURE_X86_MMX, /* MMX registers and instructions */
GMX_CPUID_FEATURE_X86_MSR, /* Supports Intel model-specific-registers */
GMX_CPUID_FEATURE_X86_NONSTOP_TSC, /* Invariant TSC (constant rate in ACPI states) */
GMX_CPUID_FEATURE_X86_PCID, /* Process context identifier support */
GMX_CPUID_FEATURE_X86_PCLMULDQ, /* Carry-less 64-bit multiplication supported */
GMX_CPUID_FEATURE_X86_PDCM, /* Perfmon and Debug Capability */
GMX_CPUID_FEATURE_X86_PDPE1GB, /* Support for 1GB pages */
GMX_CPUID_FEATURE_X86_POPCNT, /* Supports the POPCNT (population count) insn */
GMX_CPUID_FEATURE_X86_PSE, /* Supports 4MB-pages (page size extension) */
GMX_CPUID_FEATURE_X86_RDRND, /* RDRAND high-quality hardware random numbers */
GMX_CPUID_FEATURE_X86_RDTSCP, /* Serializing rdtscp instruction available */
GMX_CPUID_FEATURE_X86_SSE2, /* SSE 2 */
GMX_CPUID_FEATURE_X86_SSE3, /* SSE 3 */
GMX_CPUID_FEATURE_X86_SSE4A, /* SSE 4A */
GMX_CPUID_FEATURE_X86_SSE4_1, /* SSE 4.1 */
GMX_CPUID_FEATURE_X86_SSE4_2, /* SSE 4.2 */
GMX_CPUID_FEATURE_X86_SSSE3, /* Supplemental SSE3 */
GMX_CPUID_FEATURE_X86_TDT, /* TSC deadline timer */
GMX_CPUID_FEATURE_X86_X2APIC, /* Extended xAPIC Support */
GMX_CPUID_FEATURE_X86_XOP, /* AMD extended instructions, only AMD for now */
GMX_CPUID_NFEATURES
};
/* Currently supported acceleration instruction sets, intrinsics or other similar combinations
* in Gromacs. There is not always a 1-to-1 correspondence with feature flags; on some AMD
* hardware we prefer to use 128bit AVX instructions (although 256-bit ones could be executed),
* and we still haven't written the AVX2 kernels.
*/
enum gmx_cpuid_acceleration
{
GMX_CPUID_ACCELERATION_CANNOTDETECT, /* Should only be used if something fails */
GMX_CPUID_ACCELERATION_NONE,
GMX_CPUID_ACCELERATION_X86_SSE2,
GMX_CPUID_ACCELERATION_X86_SSE4_1,
GMX_CPUID_ACCELERATION_X86_AVX_128_FMA,
GMX_CPUID_ACCELERATION_X86_AVX_256,
GMX_CPUID_ACCELERATION_SPARC64_HPC_ACE,
GMX_CPUID_ACCELERATION_IBM_QPX,
GMX_CPUID_NACCELERATIONS
};
/* Text strings corresponding to CPU vendors */
GMX_LIBGMX_EXPORT
extern const char *
gmx_cpuid_vendor_string[GMX_CPUID_NVENDORS];
/* Text strings for CPU feature indices */
extern const char *
gmx_cpuid_feature_string[GMX_CPUID_NFEATURES];
/* Text strings for Gromacs acceleration/instruction sets */
extern const char *
gmx_cpuid_acceleration_string[GMX_CPUID_NACCELERATIONS];
/* Abstract data type with CPU detection information. Set by gmx_cpuid_init(). */
typedef struct gmx_cpuid *
gmx_cpuid_t;
/* Fill the data structure by using CPU detection instructions.
* Return 0 on success, 1 if something bad happened.
*/
int
gmx_cpuid_init (gmx_cpuid_t * cpuid);
/* Return the vendor id as enumerated type. Use gmx_cpuid_vendor_string[]
* to get the corresponding text string.
*/
GMX_LIBGMX_EXPORT
enum gmx_cpuid_vendor
gmx_cpuid_vendor (gmx_cpuid_t cpuid);
/* Return a constant pointer to the processor brand string. */
const char *
gmx_cpuid_brand (gmx_cpuid_t cpuid);
/* Return processor family version. For a chip of version 1.2.3, this is 1 */
GMX_LIBGMX_EXPORT
int
gmx_cpuid_family (gmx_cpuid_t cpuid);
/* Return processor model version, For a chip of version 1.2.3, this is 2. */
GMX_LIBGMX_EXPORT
int
gmx_cpuid_model (gmx_cpuid_t cpuid);
/* Return processor stepping version, For a chip of version 1.2.3, this is 3. */
int
gmx_cpuid_stepping (gmx_cpuid_t cpuid);
/* Check whether a particular CPUID feature is set.
* Returns 0 if flag "feature" is not set, 1 if the flag is set. We cannot use
* gmx_bool here since this file must be possible to compile without simple.h.
*/
GMX_LIBGMX_EXPORT
int
gmx_cpuid_feature (gmx_cpuid_t cpuid,
enum gmx_cpuid_feature feature);
/* Return pointers to cpu topology information.
*
* Important: CPU topology requires more OS support than most other
* functions in this file, including support for thread pinning to hardware.
* This means it will not work on some platforms, including e.g. Mac OS X.
* Thus, it is IMPERATIVE that you check the return value from this routine
* before doing anything with the information. It is only if the return
* value is zero that the data is valid.
*
* For the returned values we have:
* - nprocessors Total number of logical processors reported by OS
* - npackages Usually number of CPU sockets
* - ncores_per_package Number of cores in each package
* - nhwthreads_per_core Number of hardware threads per core; 2 for hyperthreading.
* - package_id Array with the package index for each logical cpu
* - core_id Array with local core index for each logical cpu
* - hwthread_id Array with local hwthread index for each logical cpu
* - locality_order Array with logical cpu numbers, sorted in order
* of physical and logical locality in the system.
*
* All arrays are of length nprocessors.
*/
GMX_LIBGMX_EXPORT
int
gmx_cpuid_topology(gmx_cpuid_t cpuid,
int * nprocessors,
int * npackages,
int * ncores_per_package,
int * nhwthreads_per_core,
const int ** package_id,
const int ** core_id,
const int ** hwthread_id,
const int ** locality_order);
/* Enumerated values for x86 SMT enabled-status. Note that this does not refer
* to Hyper-Threading support (that is the flag GMX_CPUID_FEATURE_X86_HTT), but
* whether Hyper-Threading is _enabled_ and _used_ in bios right now.
*/
enum gmx_cpuid_x86_smt
{
GMX_CPUID_X86_SMT_CANNOTDETECT,
GMX_CPUID_X86_SMT_DISABLED,
GMX_CPUID_X86_SMT_ENABLED
};
/* Returns the status of x86 SMT support. IMPORTANT: There are non-zero
* return values for this routine that still do not indicate supported and
* enabled smt/Hyper-Threading. You need to carefully check the return value
* against the enumerated type values to see what you are getting.
*
* Long-term, this functionality will move to a new hardware topology detection
* layer, but that will require a lot of new code and a working interface to the
* hwloc library. Surprisingly, there is no simple way to find out that
* Hyper-Threading is actually turned on without fully enumerating and checking
* all the cores, which we presently can only do on Linux. This means a couple
* of things:
*
* 1) If you want to know whether your CPU _supports_ Hyper-Threading in the
* first place, check the GMX_CPUID_FEATURE_X86_HTT flag instead!
* 2) There are several scenarios where this routine will say that it cannot
* detect whether SMT is enabled and used right now.
* 3) If you need support on non-Linux x86, you have to write it :-)
* 4) Don't invest too much efforts, since this will be replaced with
* full hardware topology detection in the future.
* 5) Don't worry if the detection does not work. It is not a catastrophe, but
* but we get slightly better performance on x86 if we use Hyper-Threading
* cores in direct space, but not reciprocal space.
*
* Since this routine presently only supports Hyper-Threading we say X86_SMT
* in order not to give the impression we can detect any SMT. We haven't
* even tested the performance on other SMT implementations, so it is not
* obvious we shouldn't use SMT there.
*
* Note that you can get more complete topology information from
* gmx_cpuid_topology(), although that requires slightly more OS support.
*/
GMX_LIBGMX_EXPORT
enum gmx_cpuid_x86_smt
gmx_cpuid_x86_smt(gmx_cpuid_t cpuid);
/* Formats a text string (up to n characters) from the data structure.
* The output will have max 80 chars between newline characters.
*/
int
gmx_cpuid_formatstring (gmx_cpuid_t cpuid,
char * s,
int n);
/* Suggests a suitable gromacs acceleration based on the support in the
* hardware.
*/
enum gmx_cpuid_acceleration
gmx_cpuid_acceleration_suggest (gmx_cpuid_t cpuid);
/* Check if this binary was compiled with the same acceleration as we
* would suggest for the current hardware. Always print stats to the log file
* if it is non-NULL, and if we don't have a match, print a warning in log
* (if non-NULL) and if print_to_stderr!=0 also to stderr.
*/
int
gmx_cpuid_acceleration_check (gmx_cpuid_t cpuid,
FILE * log,
int print_to_stderr);
/* Release resources used by data structure. Note that the pointer to the
* CPU brand string will no longer be valid once this routine has been called.
*/
void
gmx_cpuid_done (gmx_cpuid_t cpuid);
#ifdef __cplusplus
}
#endif
#endif /* GMX_CPUID_H_ */
|