v8/tools/profiling/linux-perf-d8.py

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

233 lines
6.9 KiB
Python
Raw Normal View History

#!/usr/bin/env python3
# Copyright 2022 the V8 project authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
from datetime import datetime
from pathlib import Path
import optparse
import os
import psutil
import shlex
import signal
import subprocess
import time
# ==============================================================================
usage = """Usage: %prog $D8_BIN [OPTION]... -- [D8_OPTION]... [FILE]
This script runs linux-perf with custom V8 logging to get support to resolve
JS function names.
The perf data is written to OUT_DIR separate by renderer process.
See http://v8.dev//linux-perf for more detailed instructions.
See $D8_BIN --help for more options
"""
parser = optparse.OptionParser(usage=usage)
parser.add_option(
'--perf-data-dir',
default=None,
metavar="OUT_DIR",
help="Output directory for linux perf profile files")
parser.add_option("--timeout", type=float, help="Stop d8 after N seconds")
d8_options = optparse.OptionGroup(
parser, "d8-forwarded Options",
"THese options are for a better script experience that are forward directly"
"to d8. Any other d8 option can be passed after the '--' arguments"
"separator.")
d8_options.add_option(
"--perf-prof-annotate-wasm",
help="Load wasm source map and provide annotate wasm code.",
action="store_true",
default=False)
d8_options.add_option(
"--no-interpreted-frames-native-stack",
help="For profiling v8 copies the interpreter entry trampoline for every "
"interpreted function. This makes interpreted functions identifiable on the "
"native stack at cost of a slight performance and memory overhead.",
action="store_true",
default=False)
parser.add_option_group(d8_options)
perf_options = optparse.OptionGroup(
parser, "perf-forward options", """
These options are forward directly to the `perf record` command and can be
used to manually tweak how profiling works.
See `perf record --help for more` informationn
""")
perf_options.add_option(
"--freq",
default="max",
help="Sampling frequency, either 'max' or a number in herz. "
"Might be reduced depending on the platform.")
perf_options.add_option("--call-graph", default="fp", help="Defaults tp 'fp'")
perf_options.add_option("--event", default=None, help="Not set by default.")
perf_options.add_option(
"--raw-samples",
default=None,
help="Collect raw samples. Not set by default")
perf_options.add_option(
"--count", default=None, help="Event period to sample. Not set by default.")
perf_options.add_option(
"--no-inherit",
action="store_true",
default=False,
help=" Child tasks do not inherit counters.")
parser.add_option_group(perf_options)
# ==============================================================================
def log(*args):
print("")
print("=" * 80)
print(*args)
print("=" * 80)
# ==============================================================================
(options, args) = parser.parse_args()
if len(args) == 0:
parser.error("No d8 binary provided")
d8_bin = Path(args.pop(0)).absolute()
if not d8_bin.exists():
parser.error(f"D8 '{d8_bin}' does not exist")
if options.perf_data_dir is None:
options.perf_data_dir = Path.cwd()
else:
options.perf_data_dir = Path(options.perf_data_dir).absolute()
if not options.perf_data_dir.is_dir():
parser.error(f"--perf-data-dir={options.perf_data_dir} "
"is not an directory or does not exist.")
if options.timeout and options.timeout < 0:
parser.error("--timeout should be a positive number")
# ==============================================================================
def make_path_absolute(maybe_path):
if maybe_path.startswith("-"):
return maybe_path
path = Path(maybe_path)
if path.exists():
return str(path.absolute())
return maybe_path
def make_args_paths_absolute(args):
return list(map(make_path_absolute, args))
# Preprocess args if we change CWD to get cleaner output
if options.perf_data_dir != Path.cwd():
args = make_args_paths_absolute(args)
# ==============================================================================
old_cwd = Path.cwd()
os.chdir(options.perf_data_dir)
# ==============================================================================
cmd = [str(d8_bin), "--perf-prof"]
if not options.no_interpreted_frames_native_stack:
cmd += ["--interpreted-frames-native-stack"]
if options.perf_prof_annotate_wasm:
cmd += ["--perf-prof-annotate-wasm"]
cmd += args
log("D8 CMD: ", shlex.join(cmd))
datetime_str = datetime.now().strftime("%Y-%m-%d_%H%M%S")
perf_data_file = Path.cwd() / f"d8_{datetime_str}.perf.data"
perf_cmd = [
"perf", "record", f"--call-graph={options.call_graph}",
f"--freq={options.freq}", "--clockid=mono", f"--output={perf_data_file}"
]
if options.count:
perf_cmd += [f"--count={options.count}"]
if options.raw_samples:
perf_cmd += [f"--raw_samples={options.raw_samples}"]
if options.event:
perf_cmd += [f"--event={options.event}"]
if options.no_inherit:
perf_cmd += [f"--no-inherit"]
cmd = perf_cmd + ["--"] + cmd
log("LINUX PERF CMD: ", shlex.join(cmd))
def wait_for_process_timeout(process):
sleeping_time = 0
while (sleeping_time < options.timeout):
processHasStopped = process.poll() is not None
if processHasStopped:
return True
time.sleep(0.1)
return False
if options.timeout is None:
try:
subprocess.check_call(cmd)
except:
log("ERROR running perf record")
else:
process = subprocess.Popen(cmd)
if not wait_for_process_timeout(process):
log(f"QUITING d8 processes after {options.timeout}s timeout")
current_process = psutil.Process()
children = current_process.children(recursive=True)
for child in children:
if "d8" in child.name():
print(f" quitting PID={child.pid}")
child.send_signal(signal.SIGQUIT)
# Wait for linux-perf to write out files
time.sleep(1)
return_status = process.poll()
if return_status is None:
log("Force quitting linux-perf")
process.send_signal(signal.SIGQUIT)
process.wait()
elif return_status != 0:
log("ERROR running perf record")
# ==============================================================================
log("POST PROCESSING: Injecting JS symbols")
def inject_v8_symbols(perf_dat_file):
output_file = perf_dat_file.with_suffix(".data.jitted")
cmd = [
"perf", "inject", "--jit", f"--input={perf_dat_file}",
f"--output={output_file}"
]
try:
subprocess.check_call(cmd)
print(f"Processed: {output_file}")
except:
print(shlex.join(cmd))
return None
return output_file
result = inject_v8_symbols(perf_data_file)
if result is None:
print("No perf files were successfully processed"
" Check for errors or partial results in '{options.perf_data_dir}'")
exit(1)
log(f"RESULTS in '{options.perf_data_dir}'")
BYTES_TO_MIB = 1 / 1024 / 1024
print(f"{result.name:67}{(result.stat().st_size*BYTES_TO_MIB):10.2f}MiB")
log("PPROF")
print(f"pprof -flame {result}")