blob: ba0acbd80798526fe70a10b51e34eedba790a58f [file] [log] [blame]
/*
* Copyright (C) 2018 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "src/trace_processor/importers/systrace/systrace_trace_parser.h"
#include "perfetto/base/logging.h"
#include "perfetto/ext/base/string_splitter.h"
#include "perfetto/ext/base/string_utils.h"
#include "src/trace_processor/importers/common/process_tracker.h"
#include "src/trace_processor/trace_sorter.h"
#include <inttypes.h>
#include <cctype>
#include <string>
#include <unordered_map>
namespace perfetto {
namespace trace_processor {
namespace {
std::vector<base::StringView> SplitOnSpaces(base::StringView str) {
std::vector<base::StringView> result;
for (size_t i = 0; i < str.size(); ++i) {
// Consume all spaces.
for (; i < str.size() && str.data()[i] == ' '; ++i)
;
// If we haven't reached the end consume all non-spaces and add result.
if (i != str.size()) {
size_t start = i;
for (; i < str.size() && str.data()[i] != ' '; ++i)
;
result.push_back(base::StringView(str.data() + start, i - start));
}
}
return result;
}
bool IsProcessDumpShortHeader(const std::vector<base::StringView>& tokens) {
return tokens.size() == 4 && tokens[0] == "USER" && tokens[1] == "PID" &&
tokens[2] == "TID" && tokens[3] == "CMD";
}
bool IsProcessDumpLongHeader(const std::vector<base::StringView>& tokens) {
return tokens.size() > 4 && tokens[0] == "USER" && tokens[1] == "PID" &&
tokens[2] == "PPID" && tokens[3] == "VSZ";
}
} // namespace
SystraceTraceParser::SystraceTraceParser(TraceProcessorContext* ctx)
: line_parser_(ctx), ctx_(ctx) {}
SystraceTraceParser::~SystraceTraceParser() = default;
util::Status SystraceTraceParser::Parse(std::unique_ptr<uint8_t[]> owned_buf,
size_t size) {
if (state_ == ParseState::kEndOfSystrace)
return util::OkStatus();
partial_buf_.insert(partial_buf_.end(), &owned_buf[0], &owned_buf[size]);
if (state_ == ParseState::kBeforeParse) {
state_ = partial_buf_[0] == '<' ? ParseState::kHtmlBeforeSystrace
: ParseState::kSystrace;
}
// There can be multiple trace data sections in an HTML trace, we want to
// ignore any that don't contain systrace data. In the future it would be
// good to also parse the process dump section.
const char kTraceDataSection[] =
R"(<script class="trace-data" type="application/text">)";
auto start_it = partial_buf_.begin();
for (;;) {
auto line_it = std::find(start_it, partial_buf_.end(), '\n');
if (line_it == partial_buf_.end())
break;
std::string buffer(start_it, line_it);
if (state_ == ParseState::kHtmlBeforeSystrace) {
if (base::Contains(buffer, kTraceDataSection)) {
state_ = ParseState::kTraceDataSection;
}
} else if (state_ == ParseState::kTraceDataSection) {
if (base::StartsWith(buffer, "#")) {
state_ = ParseState::kSystrace;
} else if (base::StartsWith(buffer, "PROCESS DUMP")) {
state_ = ParseState::kProcessDumpLong;
} else if (base::Contains(buffer, R"(</script>)")) {
state_ = ParseState::kHtmlBeforeSystrace;
}
} else if (state_ == ParseState::kSystrace) {
if (base::Contains(buffer, R"(</script>)")) {
state_ = ParseState::kEndOfSystrace;
break;
} else if (!base::StartsWith(buffer, "#") && !buffer.empty()) {
SystraceLine line;
util::Status status = line_tokenizer_.Tokenize(buffer, &line);
if (!status.ok())
return status;
line_parser_.ParseLine(std::move(line));
}
} else if (state_ == ParseState::kProcessDumpLong ||
state_ == ParseState::kProcessDumpShort) {
if (base::Contains(buffer, R"(</script>)")) {
state_ = ParseState::kHtmlBeforeSystrace;
} else {
std::vector<base::StringView> tokens =
SplitOnSpaces(base::StringView(buffer));
if (IsProcessDumpShortHeader(tokens)) {
state_ = ParseState::kProcessDumpShort;
} else if (IsProcessDumpLongHeader(tokens)) {
state_ = ParseState::kProcessDumpLong;
} else if (state_ == ParseState::kProcessDumpLong &&
tokens.size() >= 10) {
// Format is:
// user pid ppid vsz rss wchan pc s name my cmd line
const base::Optional<uint32_t> pid =
base::StringToUInt32(tokens[1].ToStdString());
const base::Optional<uint32_t> ppid =
base::StringToUInt32(tokens[2].ToStdString());
base::StringView name = tokens[8];
// Command line may contain spaces, merge all remaining tokens:
const char* cmd_start = tokens[9].data();
base::StringView cmd(
cmd_start,
static_cast<size_t>((buffer.data() + buffer.size()) - cmd_start));
if (!pid || !ppid) {
PERFETTO_ELOG("Could not parse line '%s'", buffer.c_str());
return util::ErrStatus("Could not parse PROCESS DUMP line");
}
ctx_->process_tracker->SetProcessMetadata(pid.value(), ppid, name);
} else if (state_ == ParseState::kProcessDumpShort &&
tokens.size() >= 4) {
// Format is:
// username pid tid my cmd line
const base::Optional<uint32_t> tgid =
base::StringToUInt32(tokens[1].ToStdString());
const base::Optional<uint32_t> tid =
base::StringToUInt32(tokens[2].ToStdString());
// Command line may contain spaces, merge all remaining tokens:
const char* cmd_start = tokens[3].data();
base::StringView cmd(
cmd_start,
static_cast<size_t>((buffer.data() + buffer.size()) - cmd_start));
StringId cmd_id =
ctx_->storage->mutable_string_pool()->InternString(cmd);
if (!tid || !tgid) {
PERFETTO_ELOG("Could not parse line '%s'", buffer.c_str());
return util::ErrStatus("Could not parse PROCESS DUMP line");
}
UniqueTid utid =
ctx_->process_tracker->UpdateThread(tid.value(), tgid.value());
ctx_->process_tracker->SetThreadNameIfUnset(utid, cmd_id);
}
}
}
start_it = line_it + 1;
}
if (state_ == ParseState::kEndOfSystrace) {
partial_buf_.clear();
} else {
partial_buf_.erase(partial_buf_.begin(), start_it);
}
return util::OkStatus();
}
void SystraceTraceParser::NotifyEndOfFile() {}
} // namespace trace_processor
} // namespace perfetto