# firefox-gecko-converter.py - Convert perf record output to Firefox's gecko profile format # SPDX-License-Identifier: GPL-2.0 # # The script converts perf.data to Gecko Profile Format, # which can be read by https://profiler.firefox.com/. # # Usage: # # perf record -a -g -F 99 sleep 60 # perf script report gecko > output.json import os import sys import json import argparse from functools import reduce from dataclasses import dataclass, field from typing import List, Dict, Optional, NamedTuple, Set, Tuple, Any # Add the Perf-Trace-Util library to the Python path sys.path.append(os.environ['PERF_EXEC_PATH'] + \ '/scripts/python/Perf-Trace-Util/lib/Perf/Trace') from perf_trace_context import * from Core import * StringID = int StackID = int FrameID = int CategoryID = int Milliseconds = float # start_time is intialiazed only once for the all event traces. start_time = None # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/profile.js#L425 # Follow Brendan Gregg's Flamegraph convention: orange for kernel and yellow for user space by default. CATEGORIES = None # The product name is used by the profiler UI to show the Operating system and Processor. PRODUCT = os.popen('uname -op').read().strip() # Here key = tid, value = Thread tid_to_thread = dict() # The category index is used by the profiler UI to show the color of the flame graph. USER_CATEGORY_INDEX = 0 KERNEL_CATEGORY_INDEX = 1 # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L156 class Frame(NamedTuple): string_id: StringID relevantForJS: bool innerWindowID: int implementation: None optimizations: None line: None column: None category: CategoryID subcategory: int # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L216 class Stack(NamedTuple): prefix_id: Optional[StackID] frame_id: FrameID # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L90 class Sample(NamedTuple): stack_id: Optional[StackID] time_ms: Milliseconds responsiveness: int @dataclass class Thread: """A builder for a profile of the thread. Attributes: comm: Thread command-line (name). pid: process ID of containing process. tid: thread ID. samples: Timeline of profile samples. frameTable: interned stack frame ID -> stack frame. stringTable: interned string ID -> string. stringMap: interned string -> string ID. stackTable: interned stack ID -> stack. stackMap: (stack prefix ID, leaf stack frame ID) -> interned Stack ID. frameMap: Stack Frame string -> interned Frame ID. comm: str pid: int tid: int samples: List[Sample] = field(default_factory=list) frameTable: List[Frame] = field(default_factory=list) stringTable: List[str] = field(default_factory=list) stringMap: Dict[str, int] = field(default_factory=dict) stackTable: List[Stack] = field(default_factory=list) stackMap: Dict[Tuple[Optional[int], int], int] = field(default_factory=dict) frameMap: Dict[str, int] = field(default_factory=dict) """ comm: str pid: int tid: int samples: List[Sample] = field(default_factory=list) frameTable: List[Frame] = field(default_factory=list) stringTable: List[str] = field(default_factory=list) stringMap: Dict[str, int] = field(default_factory=dict) stackTable: List[Stack] = field(default_factory=list) stackMap: Dict[Tuple[Optional[int], int], int] = field(default_factory=dict) frameMap: Dict[str, int] = field(default_factory=dict) def _intern_stack(self, frame_id: int, prefix_id: Optional[int]) -> int: """Gets a matching stack, or saves the new stack. Returns a Stack ID.""" key = f"{frame_id}" if prefix_id is None else f"{frame_id},{prefix_id}" # key = (prefix_id, frame_id) stack_id = self.stackMap.get(key) if stack_id is None: # return stack_id stack_id = len(self.stackTable) self.stackTable.append(Stack(prefix_id=prefix_id, frame_id=frame_id)) self.stackMap[key] = stack_id return stack_id def _intern_string(self, string: str) -> int: """Gets a matching string, or saves the new string. Returns a String ID.""" string_id = self.stringMap.get(string) if string_id is not None: return string_id string_id = len(self.stringTable) self.stringTable.append(string) self.stringMap[string] = string_id return string_id def _intern_frame(self, frame_str: str) -> int: """Gets a matching stack frame, or saves the new frame. Returns a Frame ID.""" frame_id = self.frameMap.get(frame_str) if frame_id is not None: return frame_id frame_id = len(self.frameTable) self.frameMap[frame_str] = frame_id string_id = self._intern_string(frame_str) symbol_name_to_category = KERNEL_CATEGORY_INDEX if frame_str.find('kallsyms') != -1 \ or frame_str.find('/vmlinux') != -1 \ or frame_str.endswith('.ko)') \ else USER_CATEGORY_INDEX self.frameTable.append(Frame( string_id=string_id, relevantForJS=False, innerWindowID=0, implementation=None, optimizations=None, line=None, column=None, category=symbol_name_to_category, subcategory=None, )) return frame_id def _add_sample(self, comm: str, stack: List[str], time_ms: Milliseconds) -> None: """Add a timestamped stack trace sample to the thread builder. Args: comm: command-line (name) of the thread at this sample stack: sampled stack frames. Root first, leaf last. time_ms: timestamp of sample in milliseconds. """ # Ihreads may not set their names right after they are created. # Instead, they might do it later. In such situations, to use the latest name they have set. if self.comm != comm: self.comm = comm prefix_stack_id = reduce(lambda prefix_id, frame: self._intern_stack (self._intern_frame(frame), prefix_id), stack, None) if prefix_stack_id is not None: self.samples.append(Sample(stack_id=prefix_stack_id, time_ms=time_ms, responsiveness=0)) def _to_json_dict(self) -> Dict: """Converts current Thread to GeckoThread JSON format.""" # Gecko profile format is row-oriented data as List[List], # And a schema for interpreting each index. # Schema: # https://github.com/firefox-devtools/profiler/blob/main/docs-developer/gecko-profile-format.md # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L230 return { "tid": self.tid, "pid": self.pid, "name": self.comm, # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L51 "markers": { "schema": { "name": 0, "startTime": 1, "endTime": 2, "phase": 3, "category": 4, "data": 5, }, "data": [], }, # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L90 "samples": { "schema": { "stack": 0, "time": 1, "responsiveness": 2, }, "data": self.samples }, # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L156 "frameTable": { "schema": { "location": 0, "relevantForJS": 1, "innerWindowID": 2, "implementation": 3, "optimizations": 4, "line": 5, "column": 6, "category": 7, "subcategory": 8, }, "data": self.frameTable, }, # https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L216 "stackTable": { "schema": { "prefix": 0, "frame": 1, }, "data": self.stackTable, }, "stringTable": self.stringTable, "registerTime": 0, "unregisterTime": None, "processType": "default", } # Uses perf script python interface to parse each # event and store the data in the thread builder. def process_event(param_dict: Dict) -> None: global start_time global tid_to_thread time_stamp = (param_dict['sample']['time'] // 1000) / 1000 pid = param_dict['sample']['pid'] tid = param_dict['sample']['tid'] comm = param_dict['comm'] # Start time is the time of the first sample if not start_time: start_time = time_stamp # Parse and append the callchain of the current sample into a stack. stack = [] if param_dict['callchain']: for call in param_dict['callchain']: if 'sym' not in call: continue stack.append(f'{call["sym"]["name"]} (in {call["dso"]})') if len(stack) != 0: # Reverse the stack, as root come first and the leaf at the end. stack = stack[::-1] # During perf record if -g is not used, the callchain is not available. # In that case, the symbol and dso are available in the event parameters. else: func = param_dict['symbol'] if 'symbol' in param_dict else '[unknown]' dso = param_dict['dso'] if 'dso' in param_dict else '[unknown]' stack.append(f'{func} (in {dso})') # Add sample to the specific thread. thread = tid_to_thread.get(tid) if thread is None: thread = Thread(comm=comm, pid=pid, tid=tid) tid_to_thread[tid] = thread thread._add_sample(comm=comm, stack=stack, time_ms=time_stamp) # Trace_end runs at the end and will be used to aggregate # the data into the final json object and print it out to stdout. def trace_end() -> None: threads = [thread._to_json_dict() for thread in tid_to_thread.values()] # Schema: https://github.com/firefox-devtools/profiler/blob/53970305b51b9b472e26d7457fee1d66cd4e2737/src/types/gecko-profile.js#L305 gecko_profile_with_meta = { "meta": { "interval": 1, "processType": 0, "product": PRODUCT, "stackwalk": 1, "debug": 0, "gcpoison": 0, "asyncstack": 1, "startTime": start_time, "shutdownTime": None, "version": 24, "presymbolicated": True, "categories": CATEGORIES, "markerSchema": [], }, "libs": [], "threads": threads, "processes": [], "pausedRanges": [], } json.dump(gecko_profile_with_meta, sys.stdout, indent=2) def main() -> None: global CATEGORIES parser = argparse.ArgumentParser(description="Convert perf.data to Firefox\'s Gecko Profile format") # Add the command-line options # Colors must be defined according to this: # https://github.com/firefox-devtools/profiler/blob/50124adbfa488adba6e2674a8f2618cf34b59cd2/res/css/categories.css parser.add_argument('--user-color', default='yellow', help='Color for the User category') parser.add_argument('--kernel-color', default='orange', help='Color for the Kernel category') # Parse the command-line arguments args = parser.parse_args() # Access the values provided by the user user_color = args.user_color kernel_color = args.kernel_color CATEGORIES = [ { "name": 'User', "color": user_color, "subcategories": ['Other'] }, { "name": 'Kernel', "color": kernel_color, "subcategories": ['Other'] }, ] if __name__ == '__main__': main()