/*
* Copyright (C) 2016 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "perf_clock.h"
#include <sys/mman.h>
#include <sys/syscall.h>
#include <atomic>
#include <chrono>
#include <thread>
#include <android-base/logging.h>
#include "environment.h"
#include "event_attr.h"
#include "event_fd.h"
#include "event_type.h"
#include "record.h"
// Set to true by InitPerfClock() once GetClockDiff() has succeeded; checked by
// GetPerfClock() before the diff below is used.
static bool perf_clock_initialized = false;
// Measured as (perf event timestamp - GetSystemClock() value) in nanoseconds.
// GetPerfClock() adds it to GetSystemClock() to estimate the current perf time.
static int64_t perf_clock_and_system_clock_diff_in_ns = 0;
// State shared between GetClockDiff() and the helper thread running ThreadA().
// Every member has a default initializer so that a default-constructed
// ThreadArg never exposes indeterminate values.
struct ThreadArg {
  // Tid of the helper thread. Written by ThreadA() on startup and polled by
  // GetClockDiff(), which treats 0 as "not started yet".
  std::atomic<pid_t> thread_a_tid{0};
  // Set by GetClockDiff() to let ThreadA() begin its mmap() calls.
  std::atomic<bool> start_mmap{false};
  // Address of the mapping whose timing ThreadA() selected.
  std::atomic<uint64_t> mmap_start_addr{0};
  // GetSystemClock() value taken right after the selected mmap() returned.
  // Not atomic: GetClockDiff() reads it only after joining the helper thread.
  uint64_t system_time_in_ns = 0;
  // Set by ThreadA() when mmap() fails.
  std::atomic<bool> has_error{false};
};
// Body of the helper thread started by GetClockDiff().
//
// Publishes its tid in thread_arg->thread_a_tid, waits until
// thread_arg->start_mmap becomes true, then calls mmap() several times while
// reading GetSystemClock() before and after each call. The attempt with the
// shortest interval is reported through thread_arg->mmap_start_addr and
// thread_arg->system_time_in_ns. If mmap() fails, thread_arg->has_error is set
// and the other result fields are left untouched.
static void ThreadA(ThreadArg* thread_arg) {
  thread_arg->thread_a_tid = syscall(SYS_gettid);
  while (!thread_arg->start_mmap) {
    usleep(1000);
  }
  // constexpr so that the array below is a regular fixed-size array instead of
  // a variable-length array, which is a compiler extension in C++.
  constexpr size_t TRY_MMAP_COUNT = 10;
  constexpr size_t MMAP_SIZE = 4096;
  struct TryMmap {
    void* mmap_start_addr;
    uint64_t start_system_time_in_ns;
    uint64_t end_system_time_in_ns;
  };
  TryMmap array[TRY_MMAP_COUNT];
  // In case current thread is preempted by other threads, we run mmap()
  // multiple times and use the one with the smallest time interval.
  for (size_t i = 0; i < TRY_MMAP_COUNT; ++i) {
    array[i].start_system_time_in_ns = GetSystemClock();
    array[i].mmap_start_addr = mmap(nullptr, MMAP_SIZE, PROT_WRITE,
                                    MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
    if (array[i].mmap_start_addr == MAP_FAILED) {
      // Log first: PLOG reports errno, which munmap() below could overwrite.
      PLOG(ERROR) << "mmap() failed";
      // Release the mappings created by the earlier iterations so that the
      // failure path does not leak them.
      for (size_t j = 0; j < i; ++j) {
        munmap(array[j].mmap_start_addr, MMAP_SIZE);
      }
      thread_arg->has_error = true;
      return;
    }
    array[i].end_system_time_in_ns = GetSystemClock();
  }
  // All mappings stay alive until this loop, so every attempt has a distinct
  // start address that can be matched against a perf mmap record.
  size_t best_index = 0;
  uint64_t min_duration_in_ns = UINT64_MAX;
  for (size_t i = 0; i < TRY_MMAP_COUNT; ++i) {
    uint64_t d =
        array[i].end_system_time_in_ns - array[i].start_system_time_in_ns;
    if (min_duration_in_ns > d) {
      min_duration_in_ns = d;
      best_index = i;
    }
    munmap(array[i].mmap_start_addr, MMAP_SIZE);
  }
  thread_arg->mmap_start_addr =
      reinterpret_cast<uint64_t>(array[best_index].mmap_start_addr);
  // Perf time is generated at the end of mmap() syscall, which is close to
  // the end time instead of the start time.
  thread_arg->system_time_in_ns = array[best_index].end_system_time_in_ns;
}
static bool GetClockDiff(int64_t* clock_diff_in_ns) {
ThreadArg thread_arg;
thread_arg.thread_a_tid = 0;
thread_arg.start_mmap = false;
thread_arg.has_error = false;
std::thread thread_a(ThreadA, &thread_arg);
while (thread_arg.thread_a_tid == 0) {
usleep(1000);
}
std::unique_ptr<EventTypeAndModifier> event_type =
ParseEventType("cpu-clock");
if (event_type == nullptr) {
return false;
}
perf_event_attr attr = CreateDefaultPerfEventAttr(event_type->event_type);
attr.comm = 0;
attr.mmap_data = 1;
attr.mmap = 0;
attr.inherit = 0;
attr.sample_id_all = 1;
attr.freq = 0;
attr.sample_period = 1ULL << 62; // Sample records are not needed.
std::unique_ptr<EventFd> event_fd =
EventFd::OpenEventFile(attr, thread_arg.thread_a_tid, -1, nullptr);
if (event_fd == nullptr) {
return false;
}
if (!event_fd->CreateMappedBuffer(4, true)) {
return false;
}
thread_arg.start_mmap = true;
thread_a.join();
if (thread_arg.has_error) {
return false;
}
std::vector<char> buffer;
size_t buffer_pos = 0;
size_t size = event_fd->GetAvailableMmapData(buffer, buffer_pos);
std::vector<std::unique_ptr<Record>> records =
ReadRecordsFromBuffer(attr, buffer.data(), size);
uint64_t perf_time_in_ns = 0;
for (auto& r : records) {
if (r->type() == PERF_RECORD_MMAP) {
auto& record = *static_cast<MmapRecord*>(r.get());
if (record.data->addr == thread_arg.mmap_start_addr) {
perf_time_in_ns = record.Timestamp();
}
}
}
if (perf_time_in_ns == 0) {
LOG(ERROR) << "GetPerfClockAndSystemClockDiff: can't get perf time.";
return false;
}
*clock_diff_in_ns = perf_time_in_ns - thread_arg.system_time_in_ns;
LOG(VERBOSE) << "perf_time is " << perf_time_in_ns << " ns, system_time is "
<< thread_arg.system_time_in_ns << " ns , clock_diff is "
<< *clock_diff_in_ns << " ns.";
return true;
}
// Measures the perf/system clock offset the first time it is called and
// remembers that it has done so. Returns true if the offset is available
// (already measured, or measured successfully now), false if GetClockDiff()
// fails; a failed call leaves the clock uninitialized so it can be retried.
bool InitPerfClock() {
  if (perf_clock_initialized) {
    return true;
  }
  const bool measured = GetClockDiff(&perf_clock_and_system_clock_diff_in_ns);
  if (measured) {
    perf_clock_initialized = true;
  }
  return measured;
}
// Returns GetSystemClock() shifted by the offset measured in InitPerfClock().
// CHECKs that InitPerfClock() has already succeeded.
uint64_t GetPerfClock() {
  CHECK(perf_clock_initialized);
  const auto system_time_in_ns = GetSystemClock();
  return system_time_in_ns + perf_clock_and_system_clock_diff_in_ns;
}