You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
158 lines
4.8 KiB
158 lines
4.8 KiB
/*
|
|
* Copyright 2020 The Android Open Source Project
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#undef LOG_TAG
|
|
#define LOG_TAG "GpuMem"
|
|
#define ATRACE_TAG ATRACE_TAG_GRAPHICS
|
|
|
|
#include "gpumem/GpuMem.h"
|
|
|
|
#include <android-base/stringprintf.h>
|
|
#include <libbpf.h>
|
|
#include <libbpf_android.h>
|
|
#include <log/log.h>
|
|
#include <unistd.h>
|
|
#include <utils/Timers.h>
|
|
#include <utils/Trace.h>
|
|
|
|
#include <unordered_map>
|
|
#include <vector>
|
|
|
|
namespace android {
|
|
|
|
using base::StringAppendF;
|
|
|
|
GpuMem::~GpuMem() {
|
|
bpf_detach_tracepoint(kGpuMemTraceGroup, kGpuMemTotalTracepoint);
|
|
}
|
|
|
|
void GpuMem::initialize() {
|
|
// Make sure bpf programs are loaded
|
|
bpf::waitForProgsLoaded();
|
|
|
|
errno = 0;
|
|
int fd = bpf::retrieveProgram(kGpuMemTotalProgPath);
|
|
if (fd < 0) {
|
|
ALOGE("Failed to retrieve pinned program from %s [%d(%s)]", kGpuMemTotalProgPath, errno,
|
|
strerror(errno));
|
|
return;
|
|
}
|
|
|
|
// Attach the program to the tracepoint, and the tracepoint is automatically enabled here.
|
|
errno = 0;
|
|
int count = 0;
|
|
while (bpf_attach_tracepoint(fd, kGpuMemTraceGroup, kGpuMemTotalTracepoint) < 0) {
|
|
if (++count > kGpuWaitTimeout) {
|
|
ALOGE("Failed to attach bpf program to %s/%s tracepoint [%d(%s)]", kGpuMemTraceGroup,
|
|
kGpuMemTotalTracepoint, errno, strerror(errno));
|
|
return;
|
|
}
|
|
// Retry until GPU driver loaded or timeout.
|
|
sleep(1);
|
|
}
|
|
|
|
// Use the read-only wrapper BpfMapRO to properly retrieve the read-only map.
|
|
errno = 0;
|
|
auto map = bpf::BpfMapRO<uint64_t, uint64_t>(kGpuMemTotalMapPath);
|
|
if (!map.isValid()) {
|
|
ALOGE("Failed to create bpf map from %s [%d(%s)]", kGpuMemTotalMapPath, errno,
|
|
strerror(errno));
|
|
return;
|
|
}
|
|
setGpuMemTotalMap(map);
|
|
|
|
mInitialized.store(true);
|
|
}
|
|
|
|
void GpuMem::setGpuMemTotalMap(bpf::BpfMap<uint64_t, uint64_t>& map) {
|
|
mGpuMemTotalMap = std::move(map);
|
|
}
|
|
|
|
// Dump the snapshots of global and per process memory usage on all gpus
|
|
void GpuMem::dump(const Vector<String16>& /* args */, std::string* result) {
|
|
ATRACE_CALL();
|
|
|
|
if (!mInitialized.load() || !mGpuMemTotalMap.isValid()) {
|
|
result->append("Failed to initialize GPU memory eBPF\n");
|
|
return;
|
|
}
|
|
|
|
auto res = mGpuMemTotalMap.getFirstKey();
|
|
if (!res.ok()) {
|
|
result->append("GPU memory total usage map is empty\n");
|
|
return;
|
|
}
|
|
uint64_t key = res.value();
|
|
// unordered_map<gpu_id, vector<pair<pid, size>>>
|
|
std::unordered_map<uint32_t, std::vector<std::pair<uint32_t, uint64_t>>> dumpMap;
|
|
while (true) {
|
|
uint32_t gpu_id = key >> 32;
|
|
uint32_t pid = key;
|
|
|
|
res = mGpuMemTotalMap.readValue(key);
|
|
if (!res.ok()) break;
|
|
uint64_t size = res.value();
|
|
|
|
dumpMap[gpu_id].emplace_back(pid, size);
|
|
|
|
res = mGpuMemTotalMap.getNextKey(key);
|
|
if (!res.ok()) break;
|
|
key = res.value();
|
|
}
|
|
|
|
for (auto& gpu : dumpMap) {
|
|
if (gpu.second.empty()) continue;
|
|
StringAppendF(result, "Memory snapshot for GPU %u:\n", gpu.first);
|
|
|
|
std::sort(gpu.second.begin(), gpu.second.end(),
|
|
[](auto& l, auto& r) { return l.first < r.first; });
|
|
|
|
int i = 0;
|
|
if (gpu.second[0].first != 0) {
|
|
StringAppendF(result, "Global total: N/A\n");
|
|
} else {
|
|
StringAppendF(result, "Global total: %" PRIu64 "\n", gpu.second[0].second);
|
|
i++;
|
|
}
|
|
for (; i < gpu.second.size(); i++) {
|
|
StringAppendF(result, "Proc %u total: %" PRIu64 "\n", gpu.second[i].first,
|
|
gpu.second[i].second);
|
|
}
|
|
}
|
|
}
|
|
|
|
void GpuMem::traverseGpuMemTotals(const std::function<void(int64_t ts, uint32_t gpuId, uint32_t pid,
|
|
uint64_t size)>& callback) {
|
|
auto res = mGpuMemTotalMap.getFirstKey();
|
|
if (!res.ok()) return;
|
|
uint64_t key = res.value();
|
|
while (true) {
|
|
uint32_t gpu_id = key >> 32;
|
|
uint32_t pid = key;
|
|
|
|
res = mGpuMemTotalMap.readValue(key);
|
|
if (!res.ok()) break;
|
|
uint64_t size = res.value();
|
|
|
|
callback(systemTime(), gpu_id, pid, size);
|
|
res = mGpuMemTotalMap.getNextKey(key);
|
|
if (!res.ok()) break;
|
|
key = res.value();
|
|
}
|
|
}
|
|
|
|
} // namespace android
|