mirror of
https://github.com/zebrajr/pytorch.git
synced 2025-12-07 12:21:27 +01:00
avoid unnecessary static_cast — Pull Request resolved: https://github.com/pytorch/pytorch/pull/93898 — Approved by: https://github.com/Skylion007
82 lines
2.6 KiB
C++
82 lines
2.6 KiB
C++
#include <c10/core/Allocator.h>
|
|
|
|
#include <c10/util/ThreadLocalDebugInfo.h>
|
|
|
|
namespace c10 {
|
|
|
|
static void deleteInefficientStdFunctionContext(void* ptr) {
|
|
delete static_cast<InefficientStdFunctionContext*>(ptr);
|
|
}
|
|
|
|
// Builds a DataPtr for `ptr` on `device` whose context is a freshly
// heap-allocated InefficientStdFunctionContext constructed from
// {ptr, deleter}. The context is handed to the DataPtr together with
// deleteInefficientStdFunctionContext, the function that deletes it.
at::DataPtr InefficientStdFunctionContext::makeDataPtr(
    void* ptr,
    const std::function<void(void*)>& deleter,
    Device device) {
  // Raw `new` is intentional here: the matching `delete` lives in
  // deleteInefficientStdFunctionContext.
  auto* context = new InefficientStdFunctionContext({ptr, deleter});
  return {ptr, context, &deleteInefficientStdFunctionContext, device};
}
|
|
|
|
// NOLINTNEXTLINE(cppcoreguidelines-avoid-non-const-global-variables,modernize-avoid-c-arrays,cppcoreguidelines-avoid-c-arrays)
|
|
C10_API at::Allocator* allocator_array[at::COMPILE_TIME_MAX_DEVICE_TYPES];
|
|
// NOLINTNEXTLINE(cppcoreguidelines-avoid-non-const-global-variables,modernize-avoid-c-arrays,cppcoreguidelines-avoid-c-arrays)
|
|
C10_API uint8_t allocator_priority[at::COMPILE_TIME_MAX_DEVICE_TYPES] = {0};
|
|
|
|
// Registers `alloc` as the allocator for device type `t`, provided `priority`
// is at least the priority currently recorded for that device type. A lower
// priority leaves the existing registration untouched; an equal priority
// replaces it.
void SetAllocator(at::DeviceType t, at::Allocator* alloc, uint8_t priority) {
  const auto slot = static_cast<int>(t);
  if (priority < allocator_priority[slot]) {
    return;
  }
  allocator_array[slot] = alloc;
  allocator_priority[slot] = priority;
}
|
|
|
|
// Returns the allocator stored in allocator_array for device type `t`. The
// pointer is checked for non-null via TORCH_INTERNAL_ASSERT_DEBUG_ONLY, then
// returned as-is.
at::Allocator* GetAllocator(const at::DeviceType& t) {
  const auto slot = static_cast<int>(t);
  // The local keeps the name `alloc` in case the assertion macro embeds the
  // condition text in its failure message.
  at::Allocator* alloc = allocator_array[slot];
  TORCH_INTERNAL_ASSERT_DEBUG_ONLY(alloc, "Allocator for ", t, " is not set.");
  return alloc;
}
|
|
|
|
bool memoryProfilingEnabled() {
|
|
auto* reporter_ptr = static_cast<MemoryReportingInfoBase*>(
|
|
ThreadLocalDebugInfo::get(DebugInfoKind::PROFILER_STATE));
|
|
return reporter_ptr && reporter_ptr->memoryProfilingEnabled();
|
|
}
|
|
|
|
void reportMemoryUsageToProfiler(
|
|
void* ptr,
|
|
int64_t alloc_size,
|
|
size_t total_allocated,
|
|
size_t total_reserved,
|
|
Device device) {
|
|
auto* reporter_ptr = static_cast<MemoryReportingInfoBase*>(
|
|
ThreadLocalDebugInfo::get(DebugInfoKind::PROFILER_STATE));
|
|
if (reporter_ptr) {
|
|
reporter_ptr->reportMemoryUsage(
|
|
ptr, alloc_size, total_allocated, total_reserved, device);
|
|
}
|
|
}
|
|
|
|
void reportOutOfMemoryToProfiler(
|
|
int64_t alloc_size,
|
|
size_t total_allocated,
|
|
size_t total_reserved,
|
|
Device device) {
|
|
auto* reporter_ptr = static_cast<MemoryReportingInfoBase*>(
|
|
ThreadLocalDebugInfo::get(DebugInfoKind::PROFILER_STATE));
|
|
if (reporter_ptr) {
|
|
reporter_ptr->reportOutOfMemory(
|
|
alloc_size, total_allocated, total_reserved, device);
|
|
}
|
|
}
|
|
|
|
// Out-of-line definition of the defaulted default constructor.
MemoryReportingInfoBase::MemoryReportingInfoBase() = default;
|
|
|
|
void MemoryReportingInfoBase::reportOutOfMemory(
|
|
int64_t /*alloc_size*/,
|
|
size_t /*total_allocated*/,
|
|
size_t /*total_reserved*/,
|
|
Device /*device*/) {}
|
|
|
|
} // namespace c10
|