perf jevents: Sort strings in the big C string to reduce faults

author Ian Rogers <irogers@google.com>

Thu, 24 Aug 2023 04:13:29 +0000 (21:13 -0700)

committer Arnaldo Carvalho de Melo <acme@redhat.com>

Thu, 24 Aug 2023 14:11:09 +0000 (11:11 -0300)
author Ian Rogers <irogers@google.com>
Thu, 24 Aug 2023 04:13:29 +0000 (21:13 -0700)
committer Arnaldo Carvalho de Melo <acme@redhat.com>
Thu, 24 Aug 2023 14:11:09 +0000 (11:11 -0300)
diff --git a/tools/perf/pmu-events/jevents.py b/tools/perf/pmu-events/jevents.py

index 01335a4..e5bce57 100755 (executable)
--- a/tools/perf/pmu-events/jevents.py
+++ b/tools/perf/pmu-events/jevents.py
@@ -113,13 +113,24 @@ class BigCString:
    strings: Set[str]
    big_string: Sequence[str]
    offsets: Dict[str, int]
+  insert_number: int
+  insert_point: Dict[str, int]
+  metrics: Set[str]
  
    def __init__(self):
      self.strings = set()
+    self.insert_number = 0;
+    self.insert_point = {}
+    self.metrics = set()
  
-  def add(self, s: str) -> None:
+  def add(self, s: str, metric: bool) -> None:
      """Called to add to the big string."""
-    self.strings.add(s)
+    if s not in self.strings:
+      self.strings.add(s)
+      self.insert_point[s] = self.insert_number
+      self.insert_number += 1
+      if metric:
+        self.metrics.add(s)
  
    def compute(self) -> None:
      """Called once all strings are added to compute the string and offsets."""
@@ -160,8 +171,11 @@ class BigCString:
      self.big_string = []
      self.offsets = {}
  
+    def string_cmp_key(s: str) -> Tuple[bool, int, str]:
+      return (s in self.metrics, self.insert_point[s], s)
+
      # Emit all strings that aren't folded in a sorted manner.
-    for s in sorted(self.strings):
+    for s in sorted(self.strings, key=string_cmp_key):
        if s not in folded_strings:
          self.offsets[s] = big_string_offset
          self.big_string.append(f'/* offset={big_string_offset} */ "')
@@ -574,19 +588,20 @@ def preprocess_one_file(parents: Sequence[str], item: os.DirEntry) -> None:
        assert len(mgroup) > 1, parents
        description = f"{metricgroup_descriptions[mgroup]}\\000"
        mgroup = f"{mgroup}\\000"
-      _bcs.add(mgroup)
-      _bcs.add(description)
+      _bcs.add(mgroup, metric=True)
+      _bcs.add(description, metric=True)
        _metricgroups[mgroup] = description
      return
  
    topic = get_topic(item.name)
    for event in read_json_events(item.path, topic):
      pmu_name = f"{event.pmu}\\000"
-    _bcs.add(pmu_name)
      if event.name:
-      _bcs.add(event.build_c_string(metric=False))
+      _bcs.add(pmu_name, metric=False)
+      _bcs.add(event.build_c_string(metric=False), metric=False)
      if event.metric_name:
-      _bcs.add(event.build_c_string(metric=True))
+      _bcs.add(pmu_name, metric=True)
+      _bcs.add(event.build_c_string(metric=True), metric=True)
  
  def process_one_file(parents: Sequence[str], item: os.DirEntry) -> None:
    """Process a JSON file during the main walk."""
author	Ian Rogers <irogers@google.com>
	Thu, 24 Aug 2023 04:13:29 +0000 (21:13 -0700)
committer	Arnaldo Carvalho de Melo <acme@redhat.com>
	Thu, 24 Aug 2023 14:11:09 +0000 (11:11 -0300)