AMDGPU provides a fixed frequency clock since some generations back. However, the frequency is variable by card and must be looked up at runtime. This patch adds a new device environment line for the clock frequency so that we can use it in the same way as NVPTX. This is the correct implementation and the version in ASO should be replaced. Reviewed By: tianshilei1992 Differential Revision: https://reviews.llvm.org/D154456
58 lines
1.7 KiB
C++
58 lines
1.7 KiB
C++
//===--- Configuration.h - OpenMP device configuration interface -- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// API to query the global (constant) device environment.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef OMPTARGET_CONFIGURATION_H
|
|
#define OMPTARGET_CONFIGURATION_H
|
|
|
|
#include "Types.h"
|
|
|
|
namespace ompx {
|
|
namespace config {
|
|
|
|
enum DebugKind : uint32_t {
|
|
Assertion = 1U << 0,
|
|
FunctionTracing = 1U << 1,
|
|
CommonIssues = 1U << 2,
|
|
};
|
|
|
|
/// Return the number of devices in the system, same number as returned on the
|
|
/// host by omp_get_num_devices.
|
|
uint32_t getNumDevices();
|
|
|
|
/// Return the device number in the system for omp_get_device_num.
|
|
uint32_t getDeviceNum();
|
|
|
|
/// Return the user choosen debug level.
|
|
uint32_t getDebugKind();
|
|
|
|
/// Return the amount of dynamic shared memory that was allocated at launch.
|
|
uint64_t getDynamicMemorySize();
|
|
|
|
/// Returns the cycles per second of the device's fixed frequency clock.
|
|
uint64_t getClockFrequency();
|
|
|
|
/// Return if debugging is enabled for the given debug kind.
|
|
bool isDebugMode(DebugKind Level);
|
|
|
|
/// Indicates if this kernel may require thread-specific states, or if it was
|
|
/// explicitly disabled by the user.
|
|
bool mayUseThreadStates();
|
|
|
|
/// Indicates if this kernel may require data environments for nested
|
|
/// parallelism, or if it was explicitly disabled by the user.
|
|
bool mayUseNestedParallelism();
|
|
|
|
} // namespace config
|
|
} // namespace ompx
|
|
|
|
#endif
|