| /* |
| * ompt-general.cpp -- OMPT implementation of interface functions |
| */ |
| |
| //===----------------------------------------------------------------------===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "kmp_utils.h" |
| |
| /***************************************************************************** |
| * system include files |
| ****************************************************************************/ |
| #include <assert.h> |
| |
| #include <stdint.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #if KMP_OS_UNIX |
| #include <dlfcn.h> |
| #endif |
| |
| /***************************************************************************** |
| * ompt include files |
| ****************************************************************************/ |
| |
| #include "ompt-specific.cpp" |
| |
| /***************************************************************************** |
| * macros |
| ****************************************************************************/ |
| |
| #define ompt_get_callback_success 1 |
| #define ompt_get_callback_failure 0 |
| |
| #define no_tool_present 0 |
| |
| #define OMPT_API_ROUTINE static |
| |
| #ifndef OMPT_STR_MATCH |
| #define OMPT_STR_MATCH(haystack, needle) (!strcasecmp(haystack, needle)) |
| #endif |
| |
| // prints for an enabled OMP_TOOL_VERBOSE_INIT. |
| // In the future a prefix could be added in the first define, the second define |
| // omits the prefix to allow for continued lines. Example: "PREFIX: Start |
| // tool... Success." instead of "PREFIX: Start tool... PREFIX: Success." |
| #define OMPT_VERBOSE_INIT_PRINT(...) \ |
| if (verbose_init) \ |
| fprintf(verbose_file, __VA_ARGS__) |
| #define OMPT_VERBOSE_INIT_CONTINUED_PRINT(...) \ |
| if (verbose_init) \ |
| fprintf(verbose_file, __VA_ARGS__) |
| |
| static FILE *verbose_file; |
| static int verbose_init; |
| |
| /***************************************************************************** |
| * types |
| ****************************************************************************/ |
| |
| typedef struct { |
| const char *state_name; |
| ompt_state_t state_id; |
| } ompt_state_info_t; |
| |
| typedef struct { |
| const char *name; |
| kmp_mutex_impl_t id; |
| } kmp_mutex_impl_info_t; |
| |
| enum tool_setting_e { |
| omp_tool_error, |
| omp_tool_unset, |
| omp_tool_disabled, |
| omp_tool_enabled |
| }; |
| |
| /***************************************************************************** |
| * global variables |
| ****************************************************************************/ |
| |
| ompt_callbacks_active_t ompt_enabled; |
| |
| ompt_state_info_t ompt_state_info[] = { |
| #define ompt_state_macro(state, code) {#state, state}, |
| FOREACH_OMPT_STATE(ompt_state_macro) |
| #undef ompt_state_macro |
| }; |
| |
| kmp_mutex_impl_info_t kmp_mutex_impl_info[] = { |
| #define kmp_mutex_impl_macro(name, id) {#name, name}, |
| FOREACH_KMP_MUTEX_IMPL(kmp_mutex_impl_macro) |
| #undef kmp_mutex_impl_macro |
| }; |
| |
| ompt_callbacks_internal_t ompt_callbacks; |
| |
| static ompt_start_tool_result_t *ompt_start_tool_result = NULL; |
| |
| #if KMP_OS_WINDOWS |
| static HMODULE ompt_tool_module = NULL; |
| static HMODULE ompt_archer_module = NULL; |
| #define OMPT_DLCLOSE(Lib) FreeLibrary(Lib) |
| #else |
| static void *ompt_tool_module = NULL; |
| static void *ompt_archer_module = NULL; |
| #define OMPT_DLCLOSE(Lib) dlclose(Lib) |
| #endif |
| |
| /// Used to track the initializer and the finalizer provided by libomptarget |
| static ompt_start_tool_result_t *libomptarget_ompt_result = NULL; |
| |
| /***************************************************************************** |
| * forward declarations |
| ****************************************************************************/ |
| |
| static ompt_interface_fn_t ompt_fn_lookup(const char *s); |
| |
| OMPT_API_ROUTINE ompt_data_t *ompt_get_thread_data(void); |
| |
| /***************************************************************************** |
| * initialization and finalization (private operations) |
| ****************************************************************************/ |
| |
| typedef ompt_start_tool_result_t *(*ompt_start_tool_t)(unsigned int, |
| const char *); |
| |
| #if KMP_OS_DARWIN |
| |
| // While Darwin supports weak symbols, the library that wishes to provide a new |
| // implementation has to link against this runtime which defeats the purpose |
| // of having tools that are agnostic of the underlying runtime implementation. |
| // |
| // Fortunately, the linker includes all symbols of an executable in the global |
| // symbol table by default so dlsym() even finds static implementations of |
| // ompt_start_tool. For this to work on Linux, -Wl,--export-dynamic needs to be |
| // passed when building the application which we don't want to rely on. |
| |
| static ompt_start_tool_result_t *ompt_tool_darwin(unsigned int omp_version, |
| const char *runtime_version) { |
| ompt_start_tool_result_t *ret = NULL; |
| // Search symbol in the current address space. |
| ompt_start_tool_t start_tool = |
| (ompt_start_tool_t)dlsym(RTLD_DEFAULT, "ompt_start_tool"); |
| if (start_tool) { |
| ret = start_tool(omp_version, runtime_version); |
| } |
| return ret; |
| } |
| |
| #elif OMPT_HAVE_WEAK_ATTRIBUTE |
| |
| // On Unix-like systems that support weak symbols the following implementation |
| // of ompt_start_tool() will be used in case no tool-supplied implementation of |
| // this function is present in the address space of a process. |
| |
| _OMP_EXTERN OMPT_WEAK_ATTRIBUTE ompt_start_tool_result_t * |
| ompt_start_tool(unsigned int omp_version, const char *runtime_version) { |
| ompt_start_tool_result_t *ret = NULL; |
| // Search next symbol in the current address space. This can happen if the |
| // runtime library is linked before the tool. Since glibc 2.2 strong symbols |
| // don't override weak symbols that have been found before unless the user |
| // sets the environment variable LD_DYNAMIC_WEAK. |
| ompt_start_tool_t next_tool = |
| (ompt_start_tool_t)dlsym(RTLD_NEXT, "ompt_start_tool"); |
| if (next_tool) { |
| ret = next_tool(omp_version, runtime_version); |
| } |
| return ret; |
| } |
| |
| #elif OMPT_HAVE_PSAPI |
| |
| // On Windows, the ompt_tool_windows function is used to find the |
| // ompt_start_tool symbol across all modules loaded by a process. If |
| // ompt_start_tool is found, ompt_start_tool's return value is used to |
| // initialize the tool. Otherwise, NULL is returned and OMPT won't be enabled. |
| |
| #include <psapi.h> |
| #pragma comment(lib, "psapi.lib") |
| |
| // The number of loaded modules to start enumeration with EnumProcessModules() |
| #define NUM_MODULES 128 |
| |
| static ompt_start_tool_result_t * |
| ompt_tool_windows(unsigned int omp_version, const char *runtime_version) { |
| int i; |
| DWORD needed, new_size; |
| HMODULE *modules; |
| HANDLE process = GetCurrentProcess(); |
| modules = (HMODULE *)malloc(NUM_MODULES * sizeof(HMODULE)); |
| ompt_start_tool_t ompt_tool_p = NULL; |
| |
| #if OMPT_DEBUG |
| printf("ompt_tool_windows(): looking for ompt_start_tool\n"); |
| #endif |
| if (!EnumProcessModules(process, modules, NUM_MODULES * sizeof(HMODULE), |
| &needed)) { |
| // Regardless of the error reason use the stub initialization function |
| free(modules); |
| return NULL; |
| } |
| // Check if NUM_MODULES is enough to list all modules |
| new_size = needed / sizeof(HMODULE); |
| if (new_size > NUM_MODULES) { |
| #if OMPT_DEBUG |
| printf("ompt_tool_windows(): resize buffer to %d bytes\n", needed); |
| #endif |
| modules = (HMODULE *)realloc(modules, needed); |
| // If resizing failed use the stub function. |
| if (!EnumProcessModules(process, modules, needed, &needed)) { |
| free(modules); |
| return NULL; |
| } |
| } |
| for (i = 0; i < new_size; ++i) { |
| (FARPROC &)ompt_tool_p = GetProcAddress(modules[i], "ompt_start_tool"); |
| if (ompt_tool_p) { |
| #if OMPT_DEBUG |
| TCHAR modName[MAX_PATH]; |
| if (GetModuleFileName(modules[i], modName, MAX_PATH)) |
| printf("ompt_tool_windows(): ompt_start_tool found in module %s\n", |
| modName); |
| #endif |
| free(modules); |
| return (*ompt_tool_p)(omp_version, runtime_version); |
| } |
| #if OMPT_DEBUG |
| else { |
| TCHAR modName[MAX_PATH]; |
| if (GetModuleFileName(modules[i], modName, MAX_PATH)) |
| printf("ompt_tool_windows(): ompt_start_tool not found in module %s\n", |
| modName); |
| } |
| #endif |
| } |
| free(modules); |
| return NULL; |
| } |
| #else |
| #error Activation of OMPT is not supported on this platform. |
| #endif |
| |
| static ompt_start_tool_result_t * |
| ompt_try_start_tool(unsigned int omp_version, const char *runtime_version) { |
| ompt_start_tool_result_t *ret = NULL; |
| ompt_start_tool_t start_tool = NULL; |
| #if KMP_OS_WINDOWS |
| // Cannot use colon to describe a list of absolute paths on Windows |
| const char *sep = ";"; |
| #else |
| const char *sep = ":"; |
| #endif |
| |
| OMPT_VERBOSE_INIT_PRINT("----- START LOGGING OF TOOL REGISTRATION -----\n"); |
| OMPT_VERBOSE_INIT_PRINT("Search for OMP tool in current address space... "); |
| |
| #if KMP_OS_DARWIN |
| // Try in the current address space |
| ret = ompt_tool_darwin(omp_version, runtime_version); |
| #elif OMPT_HAVE_WEAK_ATTRIBUTE |
| ret = ompt_start_tool(omp_version, runtime_version); |
| #elif OMPT_HAVE_PSAPI |
| ret = ompt_tool_windows(omp_version, runtime_version); |
| #else |
| #error Activation of OMPT is not supported on this platform. |
| #endif |
| if (ret) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success.\n"); |
| OMPT_VERBOSE_INIT_PRINT( |
| "Tool was started and is using the OMPT interface.\n"); |
| OMPT_VERBOSE_INIT_PRINT("----- END LOGGING OF TOOL REGISTRATION -----\n"); |
| return ret; |
| } |
| |
| // Try tool-libraries-var ICV |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed.\n"); |
| const char *tool_libs = getenv("OMP_TOOL_LIBRARIES"); |
| if (tool_libs) { |
| OMPT_VERBOSE_INIT_PRINT("Searching tool libraries...\n"); |
| OMPT_VERBOSE_INIT_PRINT("OMP_TOOL_LIBRARIES = %s\n", tool_libs); |
| char *libs = __kmp_str_format("%s", tool_libs); |
| char *buf; |
| char *fname = __kmp_str_token(libs, sep, &buf); |
| // Reset dl-error |
| dlerror(); |
| |
| while (fname) { |
| #if KMP_OS_UNIX |
| OMPT_VERBOSE_INIT_PRINT("Opening %s... ", fname); |
| void *h = dlopen(fname, RTLD_LAZY); |
| if (!h) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: %s\n", dlerror()); |
| } else { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success. \n"); |
| OMPT_VERBOSE_INIT_PRINT("Searching for ompt_start_tool in %s... ", |
| fname); |
| dlerror(); // Clear any existing error |
| start_tool = (ompt_start_tool_t)dlsym(h, "ompt_start_tool"); |
| if (!start_tool) { |
| char *error = dlerror(); |
| if (error != NULL) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: %s\n", error); |
| } else { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: %s\n", |
| "ompt_start_tool = NULL"); |
| } |
| } else |
| #elif KMP_OS_WINDOWS |
| OMPT_VERBOSE_INIT_PRINT("Opening %s... ", fname); |
| HMODULE h = LoadLibrary(fname); |
| if (!h) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: Error %u\n", |
| (unsigned)GetLastError()); |
| } else { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success. \n"); |
| OMPT_VERBOSE_INIT_PRINT("Searching for ompt_start_tool in %s... ", |
| fname); |
| start_tool = (ompt_start_tool_t)GetProcAddress(h, "ompt_start_tool"); |
| if (!start_tool) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: Error %u\n", |
| (unsigned)GetLastError()); |
| } else |
| #else |
| #error Activation of OMPT is not supported on this platform. |
| #endif |
| { // if (start_tool) |
| ret = (*start_tool)(omp_version, runtime_version); |
| if (ret) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success.\n"); |
| OMPT_VERBOSE_INIT_PRINT( |
| "Tool was started and is using the OMPT interface.\n"); |
| ompt_tool_module = h; |
| break; |
| } |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT( |
| "Found but not using the OMPT interface.\n"); |
| OMPT_VERBOSE_INIT_PRINT("Continuing search...\n"); |
| } |
| OMPT_DLCLOSE(h); |
| } |
| fname = __kmp_str_token(NULL, sep, &buf); |
| } |
| __kmp_str_free(&libs); |
| } else { |
| OMPT_VERBOSE_INIT_PRINT("No OMP_TOOL_LIBRARIES defined.\n"); |
| } |
| |
| // usable tool found in tool-libraries |
| if (ret) { |
| OMPT_VERBOSE_INIT_PRINT("----- END LOGGING OF TOOL REGISTRATION -----\n"); |
| return ret; |
| } |
| |
| #if KMP_OS_UNIX |
| { // Non-standard: load archer tool if application is built with TSan |
| const char *fname = "libarcher.so"; |
| OMPT_VERBOSE_INIT_PRINT( |
| "...searching tool libraries failed. Using archer tool.\n"); |
| OMPT_VERBOSE_INIT_PRINT("Opening %s... ", fname); |
| void *h = dlopen(fname, RTLD_LAZY); |
| if (h) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success.\n"); |
| OMPT_VERBOSE_INIT_PRINT("Searching for ompt_start_tool in %s... ", fname); |
| start_tool = (ompt_start_tool_t)dlsym(h, "ompt_start_tool"); |
| if (start_tool) { |
| ret = (*start_tool)(omp_version, runtime_version); |
| if (ret) { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Success.\n"); |
| OMPT_VERBOSE_INIT_PRINT( |
| "Tool was started and is using the OMPT interface.\n"); |
| OMPT_VERBOSE_INIT_PRINT( |
| "----- END LOGGING OF TOOL REGISTRATION -----\n"); |
| ompt_archer_module = h; |
| return ret; |
| } |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT( |
| "Found but not using the OMPT interface.\n"); |
| } else { |
| OMPT_VERBOSE_INIT_CONTINUED_PRINT("Failed: %s\n", dlerror()); |
| } |
| OMPT_DLCLOSE(h); |
| } |
| } |
| #endif |
| OMPT_VERBOSE_INIT_PRINT("No OMP tool loaded.\n"); |
| OMPT_VERBOSE_INIT_PRINT("----- END LOGGING OF TOOL REGISTRATION -----\n"); |
| return ret; |
| } |
| |
| void ompt_pre_init() { |
| //-------------------------------------------------- |
| // Execute the pre-initialization logic only once. |
| //-------------------------------------------------- |
| static int ompt_pre_initialized = 0; |
| |
| if (ompt_pre_initialized) |
| return; |
| |
| ompt_pre_initialized = 1; |
| |
| //-------------------------------------------------- |
| // Use a tool iff a tool is enabled and available. |
| //-------------------------------------------------- |
| const char *ompt_env_var = getenv("OMP_TOOL"); |
| tool_setting_e tool_setting = omp_tool_error; |
| |
| if (!ompt_env_var || !strcmp(ompt_env_var, "")) |
| tool_setting = omp_tool_unset; |
| else if (OMPT_STR_MATCH(ompt_env_var, "disabled")) |
| tool_setting = omp_tool_disabled; |
| else if (OMPT_STR_MATCH(ompt_env_var, "enabled")) |
| tool_setting = omp_tool_enabled; |
| |
| const char *ompt_env_verbose_init = getenv("OMP_TOOL_VERBOSE_INIT"); |
| // possible options: disabled | stdout | stderr | <filename> |
| // if set, not empty and not disabled -> prepare for logging |
| if (ompt_env_verbose_init && strcmp(ompt_env_verbose_init, "") && |
| !OMPT_STR_MATCH(ompt_env_verbose_init, "disabled")) { |
| verbose_init = 1; |
| if (OMPT_STR_MATCH(ompt_env_verbose_init, "STDERR")) |
| verbose_file = stderr; |
| else if (OMPT_STR_MATCH(ompt_env_verbose_init, "STDOUT")) |
| verbose_file = stdout; |
| else |
| verbose_file = fopen(ompt_env_verbose_init, "w"); |
| } else |
| verbose_init = 0; |
| |
| #if OMPT_DEBUG |
| printf("ompt_pre_init(): tool_setting = %d\n", tool_setting); |
| #endif |
| switch (tool_setting) { |
| case omp_tool_disabled: |
| OMPT_VERBOSE_INIT_PRINT("OMP tool disabled. \n"); |
| break; |
| |
| case omp_tool_unset: |
| case omp_tool_enabled: |
| |
| //-------------------------------------------------- |
| // Load tool iff specified in environment variable |
| //-------------------------------------------------- |
| ompt_start_tool_result = |
| ompt_try_start_tool(__kmp_openmp_version, ompt_get_runtime_version()); |
| |
| memset(&ompt_enabled, 0, sizeof(ompt_enabled)); |
| break; |
| |
| case omp_tool_error: |
| fprintf(stderr, |
| "Warning: OMP_TOOL has invalid value \"%s\".\n" |
| " legal values are (NULL,\"\",\"disabled\"," |
| "\"enabled\").\n", |
| ompt_env_var); |
| break; |
| } |
| if (verbose_init && verbose_file != stderr && verbose_file != stdout) |
| fclose(verbose_file); |
| #if OMPT_DEBUG |
| printf("ompt_pre_init(): ompt_enabled = %d\n", ompt_enabled.enabled); |
| #endif |
| } |
| |
| extern "C" int omp_get_initial_device(void); |
| |
| void ompt_post_init() { |
| //-------------------------------------------------- |
| // Execute the post-initialization logic only once. |
| //-------------------------------------------------- |
| static int ompt_post_initialized = 0; |
| |
| if (ompt_post_initialized) |
| return; |
| |
| ompt_post_initialized = 1; |
| |
| //-------------------------------------------------- |
| // Initialize the tool if so indicated. |
| //-------------------------------------------------- |
| if (ompt_start_tool_result) { |
| ompt_enabled.enabled = !!ompt_start_tool_result->initialize( |
| ompt_fn_lookup, omp_get_initial_device(), |
| &(ompt_start_tool_result->tool_data)); |
| |
| if (!ompt_enabled.enabled) { |
| // tool not enabled, zero out the bitmap, and done |
| memset(&ompt_enabled, 0, sizeof(ompt_enabled)); |
| return; |
| } |
| |
| kmp_info_t *root_thread = ompt_get_thread(); |
| |
| ompt_set_thread_state(root_thread, ompt_state_overhead); |
| __ompt_task_init(root_thread->th.th_current_task, 0); |
| |
| if (ompt_enabled.ompt_callback_thread_begin) { |
| ompt_callbacks.ompt_callback(ompt_callback_thread_begin)( |
| ompt_thread_initial, __ompt_get_thread_data_internal()); |
| } |
| ompt_data_t *task_data = nullptr; |
| ompt_data_t *parallel_data = nullptr; |
| __ompt_get_task_info_internal(0, NULL, &task_data, NULL, ¶llel_data, |
| NULL); |
| if (ompt_enabled.ompt_callback_implicit_task) { |
| ompt_callbacks.ompt_callback(ompt_callback_implicit_task)( |
| ompt_scope_begin, parallel_data, task_data, 1, 1, ompt_task_initial); |
| } |
| |
| ompt_set_thread_state(root_thread, ompt_state_work_serial); |
| } |
| } |
| |
| void ompt_fini() { |
| if (ompt_enabled.enabled) { |
| if (ompt_start_tool_result && ompt_start_tool_result->finalize) { |
| ompt_start_tool_result->finalize(&(ompt_start_tool_result->tool_data)); |
| } |
| if (libomptarget_ompt_result && libomptarget_ompt_result->finalize) { |
| libomptarget_ompt_result->finalize(NULL); |
| } |
| } |
| |
| if (ompt_archer_module) |
| OMPT_DLCLOSE(ompt_archer_module); |
| if (ompt_tool_module) |
| OMPT_DLCLOSE(ompt_tool_module); |
| memset(&ompt_enabled, 0, sizeof(ompt_enabled)); |
| } |
| |
| /***************************************************************************** |
| * interface operations |
| ****************************************************************************/ |
| |
| /***************************************************************************** |
| * state |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_enumerate_states(int current_state, int *next_state, |
| const char **next_state_name) { |
| const static int len = sizeof(ompt_state_info) / sizeof(ompt_state_info_t); |
| int i = 0; |
| |
| for (i = 0; i < len - 1; i++) { |
| if (ompt_state_info[i].state_id == current_state) { |
| *next_state = ompt_state_info[i + 1].state_id; |
| *next_state_name = ompt_state_info[i + 1].state_name; |
| return 1; |
| } |
| } |
| |
| return 0; |
| } |
| |
| OMPT_API_ROUTINE int ompt_enumerate_mutex_impls(int current_impl, |
| int *next_impl, |
| const char **next_impl_name) { |
| const static int len = |
| sizeof(kmp_mutex_impl_info) / sizeof(kmp_mutex_impl_info_t); |
| int i = 0; |
| for (i = 0; i < len - 1; i++) { |
| if (kmp_mutex_impl_info[i].id != current_impl) |
| continue; |
| *next_impl = kmp_mutex_impl_info[i + 1].id; |
| *next_impl_name = kmp_mutex_impl_info[i + 1].name; |
| return 1; |
| } |
| return 0; |
| } |
| |
| /***************************************************************************** |
| * callbacks |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE ompt_set_result_t ompt_set_callback(ompt_callbacks_t which, |
| ompt_callback_t callback) { |
| switch (which) { |
| |
| #define ompt_event_macro(event_name, callback_type, event_id) \ |
| case event_name: \ |
| ompt_callbacks.ompt_callback(event_name) = (callback_type)callback; \ |
| ompt_enabled.event_name = (callback != 0); \ |
| if (callback) \ |
| return ompt_event_implementation_status(event_name); \ |
| else \ |
| return ompt_set_always; |
| |
| FOREACH_OMPT_EVENT(ompt_event_macro) |
| |
| #undef ompt_event_macro |
| |
| default: |
| return ompt_set_error; |
| } |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_callback(ompt_callbacks_t which, |
| ompt_callback_t *callback) { |
| if (!ompt_enabled.enabled) |
| return ompt_get_callback_failure; |
| |
| switch (which) { |
| |
| #define ompt_event_macro(event_name, callback_type, event_id) \ |
| case event_name: { \ |
| ompt_callback_t mycb = \ |
| (ompt_callback_t)ompt_callbacks.ompt_callback(event_name); \ |
| if (ompt_enabled.event_name && mycb) { \ |
| *callback = mycb; \ |
| return ompt_get_callback_success; \ |
| } \ |
| return ompt_get_callback_failure; \ |
| } |
| |
| FOREACH_OMPT_EVENT(ompt_event_macro) |
| |
| #undef ompt_event_macro |
| |
| default: |
| return ompt_get_callback_failure; |
| } |
| } |
| |
| /***************************************************************************** |
| * parallel regions |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_get_parallel_info(int ancestor_level, |
| ompt_data_t **parallel_data, |
| int *team_size) { |
| if (!ompt_enabled.enabled) |
| return 0; |
| return __ompt_get_parallel_info_internal(ancestor_level, parallel_data, |
| team_size); |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_state(ompt_wait_id_t *wait_id) { |
| if (!ompt_enabled.enabled) |
| return ompt_state_work_serial; |
| int thread_state = __ompt_get_state_internal(wait_id); |
| |
| if (thread_state == ompt_state_undefined) { |
| thread_state = ompt_state_work_serial; |
| } |
| |
| return thread_state; |
| } |
| |
| /***************************************************************************** |
| * tasks |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE ompt_data_t *ompt_get_thread_data(void) { |
| if (!ompt_enabled.enabled) |
| return NULL; |
| return __ompt_get_thread_data_internal(); |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_task_info(int ancestor_level, int *type, |
| ompt_data_t **task_data, |
| ompt_frame_t **task_frame, |
| ompt_data_t **parallel_data, |
| int *thread_num) { |
| if (!ompt_enabled.enabled) |
| return 0; |
| return __ompt_get_task_info_internal(ancestor_level, type, task_data, |
| task_frame, parallel_data, thread_num); |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_task_memory(void **addr, size_t *size, |
| int block) { |
| return __ompt_get_task_memory_internal(addr, size, block); |
| } |
| |
| /***************************************************************************** |
| * num_procs |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_get_num_procs(void) { |
| // copied from kmp_ftn_entry.h (but modified: OMPT can only be called when |
| // runtime is initialized) |
| return __kmp_avail_proc; |
| } |
| |
| /***************************************************************************** |
| * places |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_get_num_places(void) { |
| // copied from kmp_ftn_entry.h (but modified) |
| #if !KMP_AFFINITY_SUPPORTED |
| return 0; |
| #else |
| if (!KMP_AFFINITY_CAPABLE()) |
| return 0; |
| return __kmp_affinity.num_masks; |
| #endif |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_place_proc_ids(int place_num, int ids_size, |
| int *ids) { |
| // copied from kmp_ftn_entry.h (but modified) |
| #if !KMP_AFFINITY_SUPPORTED |
| return 0; |
| #else |
| int i, count; |
| SimpleVLA<int> tmp_ids(ids_size); |
| for (int j = 0; j < ids_size; j++) |
| tmp_ids[j] = 0; |
| if (!KMP_AFFINITY_CAPABLE()) |
| return 0; |
| if (place_num < 0 || place_num >= (int)__kmp_affinity.num_masks) |
| return 0; |
| /* TODO: Is this safe for asynchronous call from signal handler during runtime |
| * shutdown? */ |
| kmp_affin_mask_t *mask = KMP_CPU_INDEX(__kmp_affinity.masks, place_num); |
| count = 0; |
| KMP_CPU_SET_ITERATE(i, mask) { |
| if ((!KMP_CPU_ISSET(i, __kmp_affin_fullMask)) || |
| (!KMP_CPU_ISSET(i, mask))) { |
| continue; |
| } |
| if (count < ids_size) |
| tmp_ids[count] = i; |
| count++; |
| } |
| if (ids_size >= count) { |
| for (i = 0; i < count; i++) { |
| ids[i] = tmp_ids[i]; |
| } |
| } |
| return count; |
| #endif |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_place_num(void) { |
| // copied from kmp_ftn_entry.h (but modified) |
| #if !KMP_AFFINITY_SUPPORTED |
| return -1; |
| #else |
| if (!ompt_enabled.enabled || __kmp_get_gtid() < 0) |
| return -1; |
| |
| int gtid; |
| kmp_info_t *thread; |
| if (!KMP_AFFINITY_CAPABLE()) |
| return -1; |
| gtid = __kmp_entry_gtid(); |
| thread = __kmp_thread_from_gtid(gtid); |
| if (thread == NULL || thread->th.th_current_place < 0) |
| return -1; |
| return thread->th.th_current_place; |
| #endif |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_partition_place_nums(int place_nums_size, |
| int *place_nums) { |
| // copied from kmp_ftn_entry.h (but modified) |
| #if !KMP_AFFINITY_SUPPORTED |
| return 0; |
| #else |
| if (!ompt_enabled.enabled || __kmp_get_gtid() < 0) |
| return 0; |
| |
| int i, gtid, place_num, first_place, last_place, start, end; |
| kmp_info_t *thread; |
| if (!KMP_AFFINITY_CAPABLE()) |
| return 0; |
| gtid = __kmp_entry_gtid(); |
| thread = __kmp_thread_from_gtid(gtid); |
| if (thread == NULL) |
| return 0; |
| first_place = thread->th.th_first_place; |
| last_place = thread->th.th_last_place; |
| if (first_place < 0 || last_place < 0) |
| return 0; |
| if (first_place <= last_place) { |
| start = first_place; |
| end = last_place; |
| } else { |
| start = last_place; |
| end = first_place; |
| } |
| if (end - start <= place_nums_size) |
| for (i = 0, place_num = start; place_num <= end; ++place_num, ++i) { |
| place_nums[i] = place_num; |
| } |
| return end - start + 1; |
| #endif |
| } |
| |
| /***************************************************************************** |
| * places |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_get_proc_id(void) { |
| if (!ompt_enabled.enabled || __kmp_get_gtid() < 0) |
| return -1; |
| #if KMP_HAVE_SCHED_GETCPU |
| return sched_getcpu(); |
| #elif KMP_OS_WINDOWS |
| PROCESSOR_NUMBER pn; |
| GetCurrentProcessorNumberEx(&pn); |
| return 64 * pn.Group + pn.Number; |
| #else |
| return -1; |
| #endif |
| } |
| |
| /***************************************************************************** |
| * compatability |
| ****************************************************************************/ |
| |
| /* |
| * Currently unused function |
| OMPT_API_ROUTINE int ompt_get_ompt_version() { return OMPT_VERSION; } |
| */ |
| |
| /***************************************************************************** |
| * application-facing API |
| ****************************************************************************/ |
| |
| /*---------------------------------------------------------------------------- |
| | control |
| ---------------------------------------------------------------------------*/ |
| |
| int __kmp_control_tool(uint64_t command, uint64_t modifier, void *arg) { |
| |
| if (ompt_enabled.enabled) { |
| if (ompt_enabled.ompt_callback_control_tool) { |
| return ompt_callbacks.ompt_callback(ompt_callback_control_tool)( |
| command, modifier, arg, OMPT_LOAD_RETURN_ADDRESS(__kmp_entry_gtid())); |
| } else { |
| return -1; |
| } |
| } else { |
| return -2; |
| } |
| } |
| |
| /***************************************************************************** |
| * misc |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE uint64_t ompt_get_unique_id(void) { |
| return __ompt_get_unique_id_internal(); |
| } |
| |
| OMPT_API_ROUTINE void ompt_finalize_tool(void) { __kmp_internal_end_atexit(); } |
| |
| /***************************************************************************** |
| * Target |
| ****************************************************************************/ |
| |
| OMPT_API_ROUTINE int ompt_get_target_info(uint64_t *device_num, |
| ompt_id_t *target_id, |
| ompt_id_t *host_op_id) { |
| return 0; // thread is not in a target region |
| } |
| |
| OMPT_API_ROUTINE int ompt_get_num_devices(void) { |
| return 1; // only one device (the current device) is available |
| } |
| |
| /***************************************************************************** |
| * API inquiry for tool |
| ****************************************************************************/ |
| |
| static ompt_interface_fn_t ompt_fn_lookup(const char *s) { |
| |
| #define ompt_interface_fn(fn) \ |
| fn##_t fn##_f = fn; \ |
| if (strcmp(s, #fn) == 0) \ |
| return (ompt_interface_fn_t)fn##_f; |
| |
| FOREACH_OMPT_INQUIRY_FN(ompt_interface_fn) |
| |
| #undef ompt_interface_fn |
| |
| return NULL; |
| } |
| |
| static ompt_data_t *ompt_get_task_data() { return __ompt_get_task_data(); } |
| |
| static ompt_data_t *ompt_get_target_task_data() { |
| return __ompt_get_target_task_data(); |
| } |
| |
| /// Lookup function to query libomp callbacks registered by the tool |
| static ompt_interface_fn_t ompt_libomp_target_fn_lookup(const char *s) { |
| #define provide_fn(fn) \ |
| if (strcmp(s, #fn) == 0) \ |
| return (ompt_interface_fn_t)fn; |
| |
| provide_fn(ompt_get_callback); |
| provide_fn(ompt_get_task_data); |
| provide_fn(ompt_get_target_task_data); |
| #undef provide_fn |
| |
| #define ompt_interface_fn(fn, type, code) \ |
| if (strcmp(s, #fn) == 0) \ |
| return (ompt_interface_fn_t)ompt_callbacks.ompt_callback(fn); |
| |
| FOREACH_OMPT_DEVICE_EVENT(ompt_interface_fn) |
| FOREACH_OMPT_EMI_EVENT(ompt_interface_fn) |
| FOREACH_OMPT_NOEMI_EVENT(ompt_interface_fn) |
| #undef ompt_interface_fn |
| |
| return (ompt_interface_fn_t)0; |
| } |
| |
| /// This function is called by the libomptarget connector to assign |
| /// callbacks already registered with libomp. |
| _OMP_EXTERN void ompt_libomp_connect(ompt_start_tool_result_t *result) { |
| OMPT_VERBOSE_INIT_PRINT("libomp --> OMPT: Enter ompt_libomp_connect\n"); |
| |
| // Ensure libomp callbacks have been added if not already |
| __ompt_force_initialization(); |
| |
| if (ompt_enabled.enabled && result) { |
| OMPT_VERBOSE_INIT_PRINT("libomp --> OMPT: Connecting with libomptarget\n"); |
| // Pass in the libomp lookup function so that the already registered |
| // functions can be extracted and assigned to the callbacks in |
| // libomptarget |
| result->initialize(ompt_libomp_target_fn_lookup, |
| /* initial_device_num */ 0, /* tool_data */ nullptr); |
| // Track the object provided by libomptarget so that the finalizer can be |
| // called during OMPT finalization |
| libomptarget_ompt_result = result; |
| } |
| OMPT_VERBOSE_INIT_PRINT("libomp --> OMPT: Exit ompt_libomp_connect\n"); |
| } |