mirror of
https://github.com/jart/cosmopolitan.git
synced 2025-06-02 02:32:27 +00:00
Add OpenMP support
This commit is contained in:
parent
c1e18e7903
commit
5f8e9f14c1
742 changed files with 94643 additions and 1279 deletions
420
third_party/openmp/kmp_utility.cpp
vendored
Normal file
420
third_party/openmp/kmp_utility.cpp
vendored
Normal file
|
@ -0,0 +1,420 @@
|
|||
/*
|
||||
* kmp_utility.cpp -- Utility routines for the OpenMP support library.
|
||||
*/
|
||||
|
||||
//===----------------------------------------------------------------------===//
|
||||
//
|
||||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
// See https://llvm.org/LICENSE.txt for license information.
|
||||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
//
|
||||
//===----------------------------------------------------------------------===//
|
||||
|
||||
#include "kmp.h"
|
||||
#include "kmp_i18n.h"
|
||||
#include "kmp_str.h"
|
||||
#include "kmp_wrapper_getpid.h"
|
||||
#include <float.h>
|
||||
|
||||
static const char *unknown = "unknown";
|
||||
|
||||
#if KMP_ARCH_X86 || KMP_ARCH_X86_64
|
||||
|
||||
/* NOTE: If called before serial_initialize (i.e. from runtime_initialize), then
|
||||
the debugging package has not been initialized yet, and only "0" will print
|
||||
debugging output since the environment variables have not been read. */
|
||||
|
||||
#ifdef KMP_DEBUG
|
||||
static int trace_level = 5;
|
||||
#endif
|
||||
|
||||
/* LOG_ID_BITS = ( 1 + floor( log_2( max( log_per_phy - 1, 1 ))))
|
||||
* APIC_ID = (PHY_ID << LOG_ID_BITS) | LOG_ID
|
||||
* PHY_ID = APIC_ID >> LOG_ID_BITS
|
||||
*/
|
||||
int __kmp_get_physical_id(int log_per_phy, int apic_id) {
|
||||
int index_lsb, index_msb, temp;
|
||||
|
||||
if (log_per_phy > 1) {
|
||||
index_lsb = 0;
|
||||
index_msb = 31;
|
||||
|
||||
temp = log_per_phy;
|
||||
while ((temp & 1) == 0) {
|
||||
temp >>= 1;
|
||||
index_lsb++;
|
||||
}
|
||||
|
||||
temp = log_per_phy;
|
||||
while ((temp & 0x80000000) == 0) {
|
||||
temp <<= 1;
|
||||
index_msb--;
|
||||
}
|
||||
|
||||
/* If >1 bits were set in log_per_phy, choose next higher power of 2 */
|
||||
if (index_lsb != index_msb)
|
||||
index_msb++;
|
||||
|
||||
return ((int)(apic_id >> index_msb));
|
||||
}
|
||||
|
||||
return apic_id;
|
||||
}
|
||||
|
||||
/*
|
||||
* LOG_ID_BITS = ( 1 + floor( log_2( max( log_per_phy - 1, 1 ))))
|
||||
* APIC_ID = (PHY_ID << LOG_ID_BITS) | LOG_ID
|
||||
* LOG_ID = APIC_ID & (( 1 << LOG_ID_BITS ) - 1 )
|
||||
*/
|
||||
int __kmp_get_logical_id(int log_per_phy, int apic_id) {
|
||||
unsigned current_bit;
|
||||
int bits_seen;
|
||||
|
||||
if (log_per_phy <= 1)
|
||||
return (0);
|
||||
|
||||
bits_seen = 0;
|
||||
|
||||
for (current_bit = 1; log_per_phy != 0; current_bit <<= 1) {
|
||||
if (log_per_phy & current_bit) {
|
||||
log_per_phy &= ~current_bit;
|
||||
bits_seen++;
|
||||
}
|
||||
}
|
||||
|
||||
/* If exactly 1 bit was set in log_per_phy, choose next lower power of 2 */
|
||||
if (bits_seen == 1) {
|
||||
current_bit >>= 1;
|
||||
}
|
||||
|
||||
return ((int)((current_bit - 1) & apic_id));
|
||||
}
|
||||
|
||||
static kmp_uint64 __kmp_parse_frequency( // R: Frequency in Hz.
|
||||
char const *frequency // I: Float number and unit: MHz, GHz, or TGz.
|
||||
) {
|
||||
|
||||
double value = 0.0;
|
||||
char *unit = NULL;
|
||||
kmp_uint64 result = 0; /* Zero is a better unknown value than all ones. */
|
||||
|
||||
if (frequency == NULL) {
|
||||
return result;
|
||||
}
|
||||
value = strtod(frequency, &unit);
|
||||
if (0 < value &&
|
||||
value <= DBL_MAX) { // Good value (not overflow, underflow, etc).
|
||||
if (strcmp(unit, "MHz") == 0) {
|
||||
value = value * 1.0E+6;
|
||||
} else if (strcmp(unit, "GHz") == 0) {
|
||||
value = value * 1.0E+9;
|
||||
} else if (strcmp(unit, "THz") == 0) {
|
||||
value = value * 1.0E+12;
|
||||
} else { // Wrong unit.
|
||||
return result;
|
||||
}
|
||||
result = (kmp_uint64)value; // rounds down
|
||||
}
|
||||
return result;
|
||||
|
||||
} // func __kmp_parse_cpu_frequency
|
||||
|
||||
void __kmp_query_cpuid(kmp_cpuinfo_t *p) {
|
||||
struct kmp_cpuid buf;
|
||||
int max_arg;
|
||||
int log_per_phy;
|
||||
#ifdef KMP_DEBUG
|
||||
int cflush_size;
|
||||
#endif
|
||||
|
||||
p->initialized = 1;
|
||||
|
||||
p->flags.sse2 = 1; // Assume SSE2 by default.
|
||||
|
||||
__kmp_x86_cpuid(0, 0, &buf);
|
||||
|
||||
KA_TRACE(trace_level,
|
||||
("INFO: CPUID %d: EAX=0x%08X EBX=0x%08X ECX=0x%08X EDX=0x%08X\n", 0,
|
||||
buf.eax, buf.ebx, buf.ecx, buf.edx));
|
||||
|
||||
max_arg = buf.eax;
|
||||
|
||||
p->apic_id = -1;
|
||||
|
||||
if (max_arg >= 1) {
|
||||
int i;
|
||||
kmp_uint32 t, data[4];
|
||||
|
||||
__kmp_x86_cpuid(1, 0, &buf);
|
||||
KA_TRACE(trace_level,
|
||||
("INFO: CPUID %d: EAX=0x%08X EBX=0x%08X ECX=0x%08X EDX=0x%08X\n",
|
||||
1, buf.eax, buf.ebx, buf.ecx, buf.edx));
|
||||
|
||||
{
|
||||
#define get_value(reg, lo, mask) (((reg) >> (lo)) & (mask))
|
||||
|
||||
p->signature = buf.eax;
|
||||
p->family = get_value(buf.eax, 20, 0xff) + get_value(buf.eax, 8, 0x0f);
|
||||
p->model =
|
||||
(get_value(buf.eax, 16, 0x0f) << 4) + get_value(buf.eax, 4, 0x0f);
|
||||
p->stepping = get_value(buf.eax, 0, 0x0f);
|
||||
|
||||
#undef get_value
|
||||
|
||||
KA_TRACE(trace_level, (" family = %d, model = %d, stepping = %d\n",
|
||||
p->family, p->model, p->stepping));
|
||||
}
|
||||
|
||||
for (t = buf.ebx, i = 0; i < 4; t >>= 8, ++i) {
|
||||
data[i] = (t & 0xff);
|
||||
}
|
||||
|
||||
p->flags.sse2 = (buf.edx >> 26) & 1;
|
||||
|
||||
#ifdef KMP_DEBUG
|
||||
|
||||
if ((buf.edx >> 4) & 1) {
|
||||
/* TSC - Timestamp Counter Available */
|
||||
KA_TRACE(trace_level, (" TSC"));
|
||||
}
|
||||
if ((buf.edx >> 8) & 1) {
|
||||
/* CX8 - CMPXCHG8B Instruction Available */
|
||||
KA_TRACE(trace_level, (" CX8"));
|
||||
}
|
||||
if ((buf.edx >> 9) & 1) {
|
||||
/* APIC - Local APIC Present (multi-processor operation support */
|
||||
KA_TRACE(trace_level, (" APIC"));
|
||||
}
|
||||
if ((buf.edx >> 15) & 1) {
|
||||
/* CMOV - Conditional MOVe Instruction Available */
|
||||
KA_TRACE(trace_level, (" CMOV"));
|
||||
}
|
||||
if ((buf.edx >> 18) & 1) {
|
||||
/* PSN - Processor Serial Number Available */
|
||||
KA_TRACE(trace_level, (" PSN"));
|
||||
}
|
||||
if ((buf.edx >> 19) & 1) {
|
||||
/* CLFLUSH - Cache Flush Instruction Available */
|
||||
cflush_size =
|
||||
data[1] * 8; /* Bits 15-08: CLFLUSH line size = 8 (64 bytes) */
|
||||
KA_TRACE(trace_level, (" CLFLUSH(%db)", cflush_size));
|
||||
}
|
||||
if ((buf.edx >> 21) & 1) {
|
||||
/* DTES - Debug Trace & EMON Store */
|
||||
KA_TRACE(trace_level, (" DTES"));
|
||||
}
|
||||
if ((buf.edx >> 22) & 1) {
|
||||
/* ACPI - ACPI Support Available */
|
||||
KA_TRACE(trace_level, (" ACPI"));
|
||||
}
|
||||
if ((buf.edx >> 23) & 1) {
|
||||
/* MMX - Multimedia Extensions */
|
||||
KA_TRACE(trace_level, (" MMX"));
|
||||
}
|
||||
if ((buf.edx >> 25) & 1) {
|
||||
/* SSE - SSE Instructions */
|
||||
KA_TRACE(trace_level, (" SSE"));
|
||||
}
|
||||
if ((buf.edx >> 26) & 1) {
|
||||
/* SSE2 - SSE2 Instructions */
|
||||
KA_TRACE(trace_level, (" SSE2"));
|
||||
}
|
||||
if ((buf.edx >> 27) & 1) {
|
||||
/* SLFSNP - Self-Snooping Cache */
|
||||
KA_TRACE(trace_level, (" SLFSNP"));
|
||||
}
|
||||
#endif /* KMP_DEBUG */
|
||||
|
||||
if ((buf.edx >> 28) & 1) {
|
||||
/* Bits 23-16: Logical Processors per Physical Processor (1 for P4) */
|
||||
log_per_phy = data[2];
|
||||
p->apic_id = data[3]; /* Bits 31-24: Processor Initial APIC ID (X) */
|
||||
KA_TRACE(trace_level, (" HT(%d TPUs)", log_per_phy));
|
||||
p->physical_id = __kmp_get_physical_id(log_per_phy, p->apic_id);
|
||||
p->logical_id = __kmp_get_logical_id(log_per_phy, p->apic_id);
|
||||
}
|
||||
#ifdef KMP_DEBUG
|
||||
if ((buf.edx >> 29) & 1) {
|
||||
/* ATHROTL - Automatic Throttle Control */
|
||||
KA_TRACE(trace_level, (" ATHROTL"));
|
||||
}
|
||||
KA_TRACE(trace_level, (" ]\n"));
|
||||
|
||||
for (i = 2; i <= max_arg; ++i) {
|
||||
__kmp_x86_cpuid(i, 0, &buf);
|
||||
KA_TRACE(trace_level,
|
||||
("INFO: CPUID %d: EAX=0x%08X EBX=0x%08X ECX=0x%08X EDX=0x%08X\n",
|
||||
i, buf.eax, buf.ebx, buf.ecx, buf.edx));
|
||||
}
|
||||
#endif
|
||||
p->flags.rtm = 0;
|
||||
p->flags.hybrid = 0;
|
||||
if (max_arg > 7) {
|
||||
/* RTM bit CPUID.07:EBX, bit 11 */
|
||||
/* HYRBID bit CPUID.07:EDX, bit 15 */
|
||||
__kmp_x86_cpuid(7, 0, &buf);
|
||||
p->flags.rtm = (buf.ebx >> 11) & 1;
|
||||
p->flags.hybrid = (buf.edx >> 15) & 1;
|
||||
if (p->flags.rtm) {
|
||||
KA_TRACE(trace_level, (" RTM"));
|
||||
}
|
||||
if (p->flags.hybrid) {
|
||||
KA_TRACE(trace_level, (" HYBRID"));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
{ // Parse CPU brand string for frequency, saving the string for later.
|
||||
int i;
|
||||
kmp_cpuid_t *base = (kmp_cpuid_t *)&p->name[0];
|
||||
|
||||
// Get CPU brand string.
|
||||
for (i = 0; i < 3; ++i) {
|
||||
__kmp_x86_cpuid(0x80000002 + i, 0, base + i);
|
||||
}
|
||||
p->name[sizeof(p->name) - 1] = 0; // Just in case. ;-)
|
||||
KA_TRACE(trace_level, ("cpu brand string: \"%s\"\n", &p->name[0]));
|
||||
|
||||
// Parse frequency.
|
||||
p->frequency = __kmp_parse_frequency(strrchr(&p->name[0], ' '));
|
||||
KA_TRACE(trace_level,
|
||||
("cpu frequency from brand string: %" KMP_UINT64_SPEC "\n",
|
||||
p->frequency));
|
||||
}
|
||||
}
|
||||
|
||||
#endif /* KMP_ARCH_X86 || KMP_ARCH_X86_64 */
|
||||
|
||||
void __kmp_expand_host_name(char *buffer, size_t size) {
|
||||
KMP_DEBUG_ASSERT(size >= sizeof(unknown));
|
||||
#if KMP_OS_WINDOWS
|
||||
{
|
||||
DWORD s = size;
|
||||
|
||||
if (!GetComputerNameA(buffer, &s))
|
||||
KMP_STRCPY_S(buffer, size, unknown);
|
||||
}
|
||||
#elif KMP_OS_WASI
|
||||
KMP_STRCPY_S(buffer, size, unknown);
|
||||
#else
|
||||
buffer[size - 2] = 0;
|
||||
if (gethostname(buffer, size) || buffer[size - 2] != 0)
|
||||
KMP_STRCPY_S(buffer, size, unknown);
|
||||
#endif
|
||||
}
|
||||
|
||||
/* Expand the meta characters in the filename:
|
||||
* Currently defined characters are:
|
||||
* %H the hostname
|
||||
* %P the number of threads used.
|
||||
* %I the unique identifier for this run.
|
||||
*/
|
||||
|
||||
void __kmp_expand_file_name(char *result, size_t rlen, char *pattern) {
|
||||
char *pos = result, *end = result + rlen - 1;
|
||||
char buffer[256];
|
||||
int default_cpu_width = 1;
|
||||
int snp_result;
|
||||
|
||||
KMP_DEBUG_ASSERT(rlen > 0);
|
||||
*end = 0;
|
||||
{
|
||||
int i;
|
||||
for (i = __kmp_xproc; i >= 10; i /= 10, ++default_cpu_width)
|
||||
;
|
||||
}
|
||||
|
||||
if (pattern != NULL) {
|
||||
while (*pattern != '\0' && pos < end) {
|
||||
if (*pattern != '%') {
|
||||
*pos++ = *pattern++;
|
||||
} else {
|
||||
char *old_pattern = pattern;
|
||||
int width = 1;
|
||||
int cpu_width = default_cpu_width;
|
||||
|
||||
++pattern;
|
||||
|
||||
if (*pattern >= '0' && *pattern <= '9') {
|
||||
width = 0;
|
||||
do {
|
||||
width = (width * 10) + *pattern++ - '0';
|
||||
} while (*pattern >= '0' && *pattern <= '9');
|
||||
if (width < 0 || width > 1024)
|
||||
width = 1;
|
||||
|
||||
cpu_width = width;
|
||||
}
|
||||
|
||||
switch (*pattern) {
|
||||
case 'H':
|
||||
case 'h': {
|
||||
__kmp_expand_host_name(buffer, sizeof(buffer));
|
||||
KMP_STRNCPY(pos, buffer, end - pos + 1);
|
||||
if (*end == 0) {
|
||||
while (*pos)
|
||||
++pos;
|
||||
++pattern;
|
||||
} else
|
||||
pos = end;
|
||||
} break;
|
||||
case 'P':
|
||||
case 'p': {
|
||||
snp_result = KMP_SNPRINTF(pos, end - pos + 1, "%0*d", cpu_width,
|
||||
__kmp_dflt_team_nth);
|
||||
if (snp_result >= 0 && snp_result <= end - pos) {
|
||||
while (*pos)
|
||||
++pos;
|
||||
++pattern;
|
||||
} else
|
||||
pos = end;
|
||||
} break;
|
||||
case 'I':
|
||||
case 'i': {
|
||||
pid_t id = getpid();
|
||||
#if (KMP_ARCH_X86_64 || KMP_ARCH_AARCH64) && defined(__MINGW32__)
|
||||
snp_result = KMP_SNPRINTF(pos, end - pos + 1, "%0*lld", width, id);
|
||||
#else
|
||||
snp_result = KMP_SNPRINTF(pos, end - pos + 1, "%0*d", width, id);
|
||||
#endif
|
||||
if (snp_result >= 0 && snp_result <= end - pos) {
|
||||
while (*pos)
|
||||
++pos;
|
||||
++pattern;
|
||||
} else
|
||||
pos = end;
|
||||
break;
|
||||
}
|
||||
case '%': {
|
||||
*pos++ = '%';
|
||||
++pattern;
|
||||
break;
|
||||
}
|
||||
default: {
|
||||
*pos++ = '%';
|
||||
pattern = old_pattern + 1;
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
/* TODO: How do we get rid of this? */
|
||||
if (*pattern != '\0')
|
||||
KMP_FATAL(FileNameTooLong);
|
||||
}
|
||||
|
||||
*pos = '\0';
|
||||
}
|
||||
|
||||
#if !OMPT_SUPPORT
|
||||
extern "C" {
|
||||
typedef struct ompt_start_tool_result_t ompt_start_tool_result_t;
|
||||
// Define symbols expected by VERSION script
|
||||
ompt_start_tool_result_t *ompt_start_tool(unsigned int omp_version,
|
||||
const char *runtime_version) {
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
void ompt_libomp_connect(ompt_start_tool_result_t *result) { result = nullptr; }
|
||||
}
|
||||
#endif
|
Loading…
Add table
Add a link
Reference in a new issue