improve pahole script and pack a few classes

(*) fix: I was subtracting the padding space instead of adding it when calculating how much free space we had to improve. (*) sort input data, so we process structs located in the same DSO together, which reduces GDB's memory usage (*) handle another error condition, where gdb's output is sufficiently mixed up that we miss the end-of-commands terminator Change-Id: Ic4bb92b736f38a2b3d90e4a14485152b7f869b43 Reviewed-on: https://gerrit.libreoffice.org/c/core/+/95041 Tested-by: Jenkins Reviewed-by: Noel Grandin <noel.grandin@collabora.co.uk>
author: Noel Grandin <noel.grandin@collabora.co.uk> 2020-05-28 13:18:41 +0200
committer: Noel Grandin <noel.grandin@collabora.co.uk> 2020-05-29 09:40:12 +0200
commit: 31b0be0f21479323408e128f2e8a1a795e037e74 (patch)
tree: 97f4d31113dc06084758042cd6e87f73c5c5a43e /compilerplugins
parent: f1ce5c3e7e621334be29df0fa425803ce77afb28 (diff)
1 files changed, 86 insertions, 69 deletions
diff --git a/compilerplugins/clang/pahole-all-classes.py b/compilerplugins/clang/pahole-all-classes.py
index b95b92543427..16e851d82c7a 100755
--- a/compilerplugins/clang/pahole-all-classes.py
+++ b/compilerplugins/clang/pahole-all-classes.py
@@ -8,10 +8,8 @@
 # (2) First run the unusedfields loplugin to generate a log file
 # (3) Install the pahole stuff into your gdb, I used this one:
 #     https://github.com/PhilArmstrong/pahole-gdb
-# (4) Edit the loop near the top of the script to only produce results for one of our modules.
-#     Note that this will make GDB soak up about 8G of RAM, which is why I don't do more than one module at a time
-# (5) Run the script
-#     ./compilerplugins/clang/pahole-all-classes.py > ./compilerplugins/clang/pahole.results
+# (4) Run the script
+#     ./compilerplugins/clang/pahole-all-classes.py
 #
 
 import _thread
@@ -27,6 +25,7 @@ a = subprocess.Popen("cat n1", stdout=subprocess.PIPE, shell=True)
 
 classSet = set()
 classSourceLocDict = dict()
+locToClassDict = dict()
 with a.stdout as txt:
     for line in txt:
         tokens = line.decode('utf8').strip().split("\t")
@@ -38,6 +37,7 @@ with a.stdout as txt:
         if className in classSet: continue
         classSet.add(className)
         classSourceLocDict[className] = srcLoc
+        locToClassDict[srcLoc] = className
 a.terminate()
 
 # Some of the pahole commands are going to fail, and I cannot read the error stream and the input stream
@@ -57,83 +57,100 @@ def write_pahole_commands(classes):
 # to split them up, and that creates a mess in the parsing logic.
 def read_generator(gdbOutput):
     while True:
-        line = gdbOutput.readline().decode('utf8').strip()
+        line = gdbOutput.readline();
+        if line == "": return # end of file
+        line = line.decode('utf8').strip()
+        print("gdb: " + line)
         for split in line.split("(gdb)"):
             split = split.strip()
             if len(split) == 0: continue
             if "all-done" in split: return
             yield split
 
-classList = sorted(classSet)
+# build list of classes sorted by source location to increase the chances of
+# processing stuff stored in the same DSO together
+sortedLocs = sorted(locToClassDict.keys())
+classList = list()
+for src in sortedLocs:
+    if "include/" in src:
+        classList.append(locToClassDict[src])
 
-# Process 200 classes at a time, otherwise gdb's memory usage blows up and kills the machine
-#
-while len(classList) > 0:
+with open("compilerplugins/clang/pahole.results", "wt") as f:
+    # Process 400 classes at a time, otherwise gdb's memory usage blows up and kills the machine
+    # This number is chosen to make gdb peak at around 8G.
+    while len(classList) > 0:
 
-    currClassList = classList[1:200];
-    classList = classList[200:]
+        currClassList = classList[0:500];
+        classList = classList[500:]
 
-    gdbProc = subprocess.Popen("gdb", stdin=subprocess.PIPE, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, shell=True)
+        gdbProc = subprocess.Popen("gdb", stdin=subprocess.PIPE, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, shell=True)
 
-    stdin = io.TextIOWrapper(gdbProc.stdin, 'utf-8')
+        stdin = io.TextIOWrapper(gdbProc.stdin, 'utf-8')
 
-    # make gdb load all the debugging info
-    stdin.write("set confirm off\n")
-    for filename in sorted(os.listdir('instdir/program')):
-        if filename.endswith(".so"):
-            stdin.write("add-symbol-file instdir/program/" + filename + "\n")
-    stdin.flush()
+        # make gdb load all the debugging info
+        stdin.write("set confirm off\n")
+        # make gdb not wrap output and mess up my parsing
+        stdin.write("set width unlimited\n")
+        for filename in sorted(os.listdir('instdir/program')):
+            if filename.endswith(".so"):
+                stdin.write("add-symbol-file instdir/program/" + filename + "\n")
+        stdin.flush()
 
 
-    _thread.start_new_thread( write_pahole_commands, (currClassList,) )
+        _thread.start_new_thread( write_pahole_commands, (currClassList,) )
 
-    firstLineRegex = re.compile("/\*\s+(\d+)\s+\*/ struct")
-    fieldLineRegex = re.compile("/\*\s+(\d+)\s+(\d+)\s+\*/ ")
-    holeLineRegex = re.compile("/\* XXX (\d+) bit hole, try to pack \*/")
-    # sometimes pahole can't determine the size of a sub-struct, and then it returns bad data
-    bogusLineRegex = re.compile("/\*\s+\d+\s+0\s+\*/")
-    structLines = list()
-    foundHole = False
-    cumulativeHoleBits = 0
-    structSize = 0
-    foundBogusLine = False
-    # pahole doesn't report space at the end of the structure, so work it out myself
-    sizeOfFields = 0
-    for line in read_generator(gdbProc.stdout):
-        structLines.append(line)
-        firstLineMatch = firstLineRegex.match(line)
-        if firstLineMatch:
-            structSize = int(firstLineMatch.group(1))
-        holeLineMatch = holeLineRegex.match(line)
-        if holeLineMatch:
-            foundHole = True
-            cumulativeHoleBits += int(holeLineMatch.group(1))
-        fieldLineMatch = fieldLineRegex.match(line)
-        if fieldLineMatch:
-            fieldSize = int(fieldLineMatch.group(2))
-            sizeOfFields = int(fieldLineMatch.group(1)) + fieldSize
-        if bogusLineRegex.match(line):
-            foundBogusLine = True
-        if line == "}":
-            # Ignore very large structs, packing those is not going to help much, and
-            # re-organising them can make them much less readable.
-            if foundHole and len(structLines) < 12 and structSize < 100 and not foundBogusLine:
-                # Verify that we have enough hole-space that removing it will result in a structure
-                # that still satisfies alignment requirements, otherwise the compiler will just put empty
-                # space at the end of the struct.
-                # TODO improve detection of the required alignment for a structure
-                potentialSpace = (cumulativeHoleBits / 8) + (sizeOfFields - structSize)
-                if potentialSpace >= 8:
-                    for line in structLines:
-                        print(line)
-                    if (sizeOfFields - structSize) > 0:
-                        print("hole at end of struct: " + str(sizeOfFields - structSize))
-            #  reset state
-            structLines.clear()
-            foundHole = False
-            cumulativeHoleBits = 0
-            structSize = 0
-            foundBogusLine = False
-            actualStructSize = 0
+        firstLineRegex = re.compile("/\*\s+(\d+)\s+\*/ struct") # /* 16 */ struct Foo
+        fieldLineRegex = re.compile("/\*\s+(\d+)\s+(\d+)\s+\*/ ") # /* 12 8 */ class rtl::OUString aName
+        holeLineRegex = re.compile("/\* XXX (\d+) bit hole, try to pack \*/")
+        # sometimes pahole can't determine the size of a sub-struct, and then it returns bad data
+        bogusLineRegex = re.compile("/\*\s+\d+\s+0\s+\*/")
+        structLines = list()
+        foundHole = False
+        cumulativeHoleBits = 0
+        alignedStructSize = 0
+        foundBogusLine = False
+        # pahole doesn't report space at the end of the structure, so work it out myself
+        sizeOfStructWithoutPadding = 0
+        for line in read_generator(gdbProc.stdout):
+            structLines.append(line)
+            firstLineMatch = firstLineRegex.match(line)
+            if firstLineMatch:
+                alignedStructSize = int(firstLineMatch.group(1))
+                structLines.clear()
+                structLines.append(line)
+            holeLineMatch = holeLineRegex.match(line)
+            if holeLineMatch:
+                foundHole = True
+                cumulativeHoleBits += int(holeLineMatch.group(1))
+            fieldLineMatch = fieldLineRegex.match(line)
+            if fieldLineMatch:
+                fieldPosInBytes = int(fieldLineMatch.group(1))
+                fieldSizeInBytes = int(fieldLineMatch.group(2))
+                sizeOfStructWithoutPadding = fieldPosInBytes + fieldSizeInBytes
+            if bogusLineRegex.match(line):
+                foundBogusLine = True
+            if line == "}":
+                # Ignore very large structs, packing those is not going to help much, and
+                # re-organising them can make them much less readable.
+                if foundHole and len(structLines) < 16 and alignedStructSize < 100 and not foundBogusLine:
+                    # Verify that, after packing, and compiler alignment, the new structure will be actually smaller.
+                    # Sometimes, we can save space, but the compiler will align the structure such that we don't
+                    # actually save any space.
+                    # TODO improve detection of the required alignment for a structure
+                    holeAtEnd = alignedStructSize - sizeOfStructWithoutPadding
+                    potentialSpace = (cumulativeHoleBits / 8) + holeAtEnd
+                    if potentialSpace >= 8:
+                        for line in structLines:
+                            f.write(line + "\n")
+                        if holeAtEnd > 0:
+                            f.write("hole at end of struct: " + str(holeAtEnd) + "\n")
+                        f.write("\n")
+                #  reset state
+                structLines.clear()
+                foundHole = False
+                cumulativeHoleBits = 0
+                structSize = 0
+                foundBogusLine = False
+                actualStructSize = 0
 
-    gdbProc.terminate()
+        gdbProc.terminate()
author	Noel Grandin <noel.grandin@collabora.co.uk>	2020-05-28 13:18:41 +0200
committer	Noel Grandin <noel.grandin@collabora.co.uk>	2020-05-29 09:40:12 +0200
commit	31b0be0f21479323408e128f2e8a1a795e037e74 (patch)
tree	97f4d31113dc06084758042cd6e87f73c5c5a43e /compilerplugins
parent	f1ce5c3e7e621334be29df0fa425803ce77afb28 (diff)