You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
graphengine/ge/hybrid/executor/hybrid_profiler.cc

98 lines
3.2 KiB

/**
* Copyright 2019-2020 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "hybrid_profiler.h"
#include <iomanip>
#include <iostream>
#include <cstdarg>
#include "framework/common/debug/ge_log.h"
#include "securec.h"
namespace ge {
namespace hybrid {
namespace {
const int kMaxEvents = 1024 * 500;
const int kEventDescMax = 512;
const int kMaxEventTypes = 8;
const int kIndent = 8;
}
HybridProfiler::HybridProfiler(): counter_(0) {
Reset();
}
void HybridProfiler::RecordEvent(EventType event_type, const char *fmt, ...) {
va_list args;
va_start(args, fmt);
char buf[kEventDescMax];
if (vsnprintf_s(buf, kEventDescMax, kEventDescMax - 1, fmt, args) == -1) {
GELOGE(FAILED, "[Parse][Param:fmt]Format %s failed.", fmt);
REPORT_CALL_ERROR("E19999", "Parse Format %s failed when HybridProfiler %s.", fmt, __FUNCTION__);
va_end(args);
return;
}
va_end(args);
auto index = counter_++;
if (index >= static_cast<int>(events_.size())) {
GELOGE(INTERNAL_ERROR,
"[Check][Range]index out of range. index = %d, max event size = %zu", index, events_.size());
REPORT_INNER_ERROR("E19999", "index out of range when HybridProfiler %s. index = %d, max event size = %zu",
__FUNCTION__, index, events_.size());
return;
}
auto &evt = events_[index];
evt.timestamp = std::chrono::system_clock::now();
evt.desc = std::string(buf);
evt.event_type = event_type;
}
void HybridProfiler::Dump(std::ostream &output_stream) {
if (events_.empty()) {
return;
}
auto start_dump = std::chrono::system_clock::now();
auto first_evt = events_[0];
auto start = first_evt.timestamp;
std::vector<decltype(start)> prev_timestamps;
prev_timestamps.resize(kMaxEventTypes, start);
for (int i = 0; i < counter_; ++i) {
auto &evt = events_[i];
auto elapsed = std::chrono::duration_cast<std::chrono::microseconds>(evt.timestamp - start).count();
auto &prev_ts = prev_timestamps[evt.event_type];
auto cost = std::chrono::duration_cast<std::chrono::microseconds>(evt.timestamp - prev_ts).count();
prev_ts = evt.timestamp;
output_stream << std::setw(kIndent) << elapsed << "\t\t" << cost << "\t\t" << evt.desc << std::endl;
}
auto end_dump = std::chrono::system_clock::now();
auto elapsed_dump = std::chrono::duration_cast<std::chrono::microseconds>(end_dump - start).count();
auto cost_dump = std::chrono::duration_cast<std::chrono::microseconds>(end_dump - start_dump).count();
output_stream << std::setw(kIndent) << elapsed_dump << "\t\t" << cost_dump
<< "\t\t" << "[Dump profiling]" << std::endl;
Reset();
}
void HybridProfiler::Reset() {
counter_ = 0;
events_.clear();
events_.resize(kMaxEvents);
}
} // namespace hybrid
} // namespace ge