2023-01-14 04:36:28 +08:00
|
|
|
#!/usr/bin/python3
|
2021-10-30 04:25:12 +08:00
|
|
|
# This file is part of the Luau programming language and is licensed under MIT License; see LICENSE.txt for details
|
|
|
|
|
|
|
|
# Given two heap snapshots (A & B), this tool performs reachability analysis on new objects allocated in B
|
|
|
|
# This is useful to find memory leaks - reachability analysis answers the question "why is this set of objects not freed"
|
|
|
|
# This tool can also be run with just one snapshot, in which case it displays all allocated objects
|
|
|
|
# The result of analysis is a .svg file which can be viewed in a browser
|
|
|
|
# To generate these dumps, use luaC_dump, ideally preceded by luaC_fullgc
|
|
|
|
|
2022-02-12 02:43:14 +08:00
|
|
|
import argparse
|
2021-10-30 04:25:12 +08:00
|
|
|
import json
|
|
|
|
import sys
|
|
|
|
import svg
|
|
|
|
|
2022-02-12 02:43:14 +08:00
|
|
|
# command line interface: one mandatory snapshot, an optional second (newer) snapshot,
# and an optional --split mode that selects how memory categories are used
argumentParser = argparse.ArgumentParser(description='Luau heap snapshot analyzer')

argumentParser.add_argument(
    '--split',
    dest='split',
    type=str,
    choices=['none', 'custom', 'all'],
    default='none',
    help='Perform additional root split using memory categories',
)

# positional arguments; 'snapshotnew' may be omitted, in which case it is None
argumentParser.add_argument('snapshot')
argumentParser.add_argument('snapshotnew', nargs='?')

arguments = argumentParser.parse_args()
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
class Node(svg.Node):
    """Graph node that accumulates heap statistics on top of svg.Node.

    Besides whatever svg.Node provides (name, width and children are used here
    but defined elsewhere), each node tracks the objects charged directly to it.
    """

    def __init__(self):
        super().__init__()
        # total byte size and number of the objects charged directly to this node
        self.size = 0
        self.count = 0
        # data for memory category filtering: the raw objects charged to this node and
        # the set of category ids found on this node or below it
        self.objects = []
        self.categories = set()

    def text(self):
        """Return the label drawn for this node (its name)."""
        return self.name

    def title(self):
        """Return the title of this node (its name)."""
        return self.name

    def details(self, root):
        """Return a one-line summary of this node relative to `root`.

        The summary contains the node name, its width in bytes, the width as a
        fraction of root.width, and the node's own size and object count.
        NOTE(review): width is not assigned in this class; presumably svg.layout
        computes it - confirm.
        """
        share = self.width / root.width
        return "{} ({:,} bytes, {:.1%}); self: {:,} bytes in {:,} objects".format(
            self.name, self.width, share, self.size, self.count
        )
|
|
|
|
|
2022-08-12 04:42:54 +08:00
|
|
|
def getkey(heap, obj, key):
    """Look up a string-valued field `key` in a dumped table object.

    `obj["pairs"]` is read as a flat list of alternating key/value addresses
    into `heap`. The first pair whose key is a string object with data equal to
    `key` decides the result: the value's data if the value is a string object,
    otherwise None. Returns None as well when no such key exists.
    """
    entries = obj.get("pairs", [])

    for idx in range(0, len(entries), 2):
        keyaddr = entries[idx]
        if not keyaddr:
            continue

        keyobj = heap[keyaddr]
        if keyobj["type"] != "string" or keyobj["data"] != key:
            continue

        # key found: only a string value is reported, anything else yields None
        valaddr = entries[idx + 1]
        if valaddr and heap[valaddr]["type"] == "string":
            return heap[valaddr]["data"]
        return None

    return None
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
# load files
# the first positional snapshot is always read; when a second one is given, the first
# becomes the baseline (dumpold) and the second becomes the snapshot being analyzed (dump)
with open(arguments.snapshot) as f:
    dump = json.load(f)

dumpold = None

if arguments.snapshotnew is not None:
    dumpold = dump
    with open(arguments.snapshotnew) as f:
        dump = json.load(f)

# address -> object mapping of the snapshot being analyzed
heap = dump["objects"]
|
|
|
|
|
2021-10-30 04:25:12 +08:00
|
|
|
# reachability analysis: how much of the heap is reachable from roots?
# The walk is breadth-first: `queue` holds (address, node) pairs and `offset` is the index of
# the next pair to process. Every object is visited once and is charged to the node through
# which it was reached first; later references to the same address are ignored.
visited = set()
queue = []
offset = 0
root = Node()

# every named root of the dump starts its own subtree under the graph root
for name, addr in dump["roots"].items():
    queue.append((addr, root.child(name)))

while offset < len(queue):
    addr, node = queue[offset]
    offset += 1
    if addr in visited:
        continue

    visited.add(addr)
    obj = heap[addr]

    # with a baseline snapshot only objects missing from the baseline are counted;
    # older objects are still traversed below so that new objects behind them are found
    if not dumpold or addr not in dumpold["objects"]:
        node.count += 1
        node.size += obj["size"]
        node.objects.append(obj)

    objtype = obj["type"]

    if objtype == "table":
        pairs = obj.get("pairs", [])
        weakkey = False
        weakval = False

        # a string "__mode" field in the metatable marks keys ("k") and/or values ("v") as weak;
        # weak references are not followed
        if "metatable" in obj:
            modemt = getkey(heap, heap[obj["metatable"]], "__mode")
            if modemt:
                weakkey = "k" in modemt
                weakval = "v" in modemt

        # pairs is a flat list of alternating key/value addresses
        for i in range(0, len(pairs), 2):
            key = pairs[i]
            val = pairs[i + 1]
            if key and heap[key]["type"] == "string":
                # string keys are always strong
                queue.append((key, node))
                # values stored under a string key get a child node named after the key
                if val and not weakval:
                    queue.append((val, node.child(heap[key]["data"])))
            else:
                if key and not weakkey:
                    queue.append((key, node))
                if val and not weakval:
                    queue.append((val, node))

        for a in obj.get("array", []):
            queue.append((a, node))
        if "metatable" in obj:
            queue.append((obj["metatable"], node.child("__meta")))
    elif objtype == "function":
        queue.append((obj["env"], node.child("__env")))

        # upvalues are grouped under a child named after the proto's source ("" when unknown)
        source = ""
        if "proto" in obj:
            proto = heap[obj["proto"]]
            if "source" in proto:
                source = proto["source"]
            queue.append((obj["proto"], node.child("__proto")))

        for a in obj.get("upvalues", []):
            queue.append((a, node.child(source)))
    elif objtype == "userdata":
        if "metatable" in obj:
            queue.append((obj["metatable"], node.child("__meta")))
    elif objtype == "thread":
        queue.append((obj["env"], node.child("__env")))

        # default to an empty stack so that a thread object without a "stack" entry
        # does not abort the analysis
        stack = obj.get("stack", [])
        stacknames = obj.get("stacknames", [])
        stacknode = node.child("__stack")
        framenode = None

        for i, slot in enumerate(stack):
            # slots without a corresponding name are treated as unnamed
            name = stacknames[i] if i < len(stacknames) else None

            # a "frame:<label>" name opens a new frame node; the slot itself is attached
            # to that frame node rather than to a named child
            if name and name.startswith("frame:"):
                framenode = stacknode.child(name[6:])
                name = None

            # named slots go under the current frame; unnamed ones go to the frame itself,
            # or to the stack node when no frame has been seen yet
            if framenode and name:
                target = framenode.child(name)
            else:
                target = framenode or stacknode

            queue.append((slot, target))
    elif objtype == "proto":
        for a in obj.get("constants", []):
            queue.append((a, node))
        for a in obj.get("protos", []):
            queue.append((a, node))
    elif objtype == "upvalue":
        if "object" in obj:
            queue.append((obj["object"], node))
|
|
|
|
|
2022-02-12 02:43:14 +08:00
|
|
|
def annotateContainedCategories(node, start):
    """Fill `node.categories` for `node` and every node below it.

    Each object charged to a node contributes its "cat" value; a value below
    `start` is first overwritten with 0 in the object itself. After the
    recursion a node's set also contains every category of its descendants.
    """
    for entry in node.objects:
        # categories below the threshold are folded into category 0 (in place)
        if entry["cat"] < start:
            entry["cat"] = 0
        node.categories.add(entry["cat"])

    for sub in node.children.values():
        annotateContainedCategories(sub, start)
        # propagate everything found in the subtree up to this node
        node.categories.update(sub.categories)
|
|
|
|
|
|
|
|
def filteredTreeForCategory(node, category):
    """Build a copy of the tree under `node` restricted to one memory category.

    Children are kept only if their `categories` set contains `category` and
    their own filtered copy is non-empty. The returned node carries the name of
    `node` and the count/size of its objects whose "cat" equals `category`.
    Returns None when the node has no kept children and no matching objects.
    """
    kept = {}

    for child in node.children.values():
        if category not in child.categories:
            continue

        subtree = filteredTreeForCategory(child, category)
        if subtree:
            kept[subtree.name] = subtree

    result = Node()
    result.name = node.name

    # re-count the objects with the correct category that we have
    for obj in node.objects:
        if obj["cat"] == category:
            result.count += 1
            result.size += obj["size"]

    # a node with surviving children is always kept, even if it has no matching objects itself
    if kept:
        result.children = kept
        return result

    # a childless node is only worth keeping when it has matching objects of its own
    return result if result.count != 0 else None
|
|
|
|
|
|
|
|
def splitIntoCategories(root):
    """Return a new root whose children are per-category copies of `root`.

    For every category id from 0 to 255 the tree is filtered with
    filteredTreeForCategory; each non-empty result is renamed to the category
    name found in dump["stats"]["categories"] and stored under that name.
    """
    split = Node()

    for cat in range(256):
        subtree = filteredTreeForCategory(root, cat)
        if not subtree:
            continue

        # category names are looked up in the dump by the decimal id as a string key
        label = dump["stats"]["categories"][str(cat)]["name"]

        subtree.name = label
        split.children[label] = subtree

    return split
|
|
|
|
|
2022-02-12 02:43:14 +08:00
|
|
|
# optional split of the graph by memory category; only done when the dump carries category
# statistics and a split mode other than 'none' was requested
if dump["stats"].get("categories") and arguments.split != 'none':
    # 'custom' folds every category below 128 into category 0, any other mode keeps all of them
    annotateContainedCategories(root, 128 if arguments.split == 'custom' else 0)

    root = splitIntoCategories(root)

# lay out the tree using each node's own byte size and emit the graph
svg.layout(root, lambda item: item.size)
svg.display(root, "Memory Graph", "cold")
|