[dumpling] Add RelateTool and DiffOracle

Danylo Mocherniuk · Mathias Payer · datenschutzakademie-ag1 · V8-internal LUCI CQ · commit 7b9f695a9e56 · 2026-01-09T01:37:08.000-08:00
DiffOracle is a library that allows to see if there was a difference between optimized and unoptimized runs. RelateTool is designed as a CLI tool to compare optimized vs unoptimized runs. Usage: swift run -c release RelateTool --d8=... --poc=... Bug: 441467877 Change-Id: Ie8850e8534ae3a890f93be77ba2d0961f51a129e Co-authored-by: Mathias Payer <mathias.payer@gmail.com> Co-authored-by: Liam Wachter <liam.g.wachter@gmail.com> Co-authored-by: Flavio Toffalini <flavio87@gmail.com> Co-authored-by: Christian Wressnegger <intellisec.de@gmail.com> Co-authored-by: Julian Gremminger <asdfju77@gmail.com> Reviewed-on: https://chrome-internal-review.googlesource.com/c/v8/fuzzilli/+/8759816 Reviewed-by: Matthias Liedtke <mliedtke@google.com> Commit-Queue: Danylo Mocherniuk <mdanylo@google.com>
diff --git a/Package.swift b/Package.swift
@@ -70,6 +70,14 @@ let package = Package(
         .executableTarget(name: "FuzzILTool",
                 dependencies: ["Fuzzilli"]),
 
+        // Tool that runs d8 in Dumpling mode twice: first with Maglev and
+        // Turbofan enabled, then with both disabled. Each run dumps frames
+        // at certain points to a file. The two dumps are then compared; if
+        // they are not equal, it means that there's likely a bug
+        // in V8.
+        .executableTarget(name: "RelateTool",
+                dependencies: ["Fuzzilli"]),
+
         .testTarget(name: "FuzzilliTests",
                     dependencies: ["Fuzzilli"],
                     resources: [.copy("CompilerTests")]),
diff --git a/Sources/Fuzzilli/DumplingDiffOracle/Oracle.swift b/Sources/Fuzzilli/DumplingDiffOracle/Oracle.swift
@@ -0,0 +1,229 @@
+// Copyright 2026 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// https://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+// The tool implemented in this file compares two Dumpling dumps for
+// equality. Each Dumpling dump consists of multiple frame dumps.
+// Example frame dump:
+// ---I
+// b:34
+// f:500
+// x:40
+// n:3
+// m:5
+// a0:1
+// a1:2
+// r0:30
+// r3:some_string
+//
+// A frame dump always starts with a header which is one of
+// ---I (for interpreter), ---S (for Sparkplug), ---M (for Maglev),
+// ---T (for Turbofan), ---D (deopt Turbofan: this is a frame produced by an actual
+// Turbofan deopt, not by Dumpling).
+// Next line with 'b' might follow (see when it and other lines might get omitted
+// in the NOTE below), it denotes bytecode offset of a dump (within a function).
+// Next line with 'f' might follow, it denotes JS function id of a dump.
+// Next line with 'x' might follow, it denotes the dump of the accumulator.
+// Next lines with 'n' and 'm' might follow, which denote the parameter count of a
+// function and the register count of a frame respectively.
+// Next multiple lines 'ai' might follow, where 'a' denotes that this is a dump
+// of a function parameter and 'i' denotes the number of the parameter.
+// Next multiple lines 'ri' might follow, where 'r' denotes that this is a dump
+// of a register and 'i' denotes the number of the register.
+// Lastly an empty line always ends the frame dump.
+//
+// NOTE: frame dumps are implemented incrementally to not write too much data
+// to the file.
+// IOW let's say we dumped 2 frames with full format as follows:
+// ---I
+// b:30
+// f:40
+// a0:1
+// a1:2
+//
+// ---I
+// b:35
+// f:40
+// a0:1
+// a1:1
+//
+// In order to save space a file will contain just:
+// ---I
+// b:30
+// f:40
+// a0:1
+// a1:2
+//
+// ---I
+// b:35
+// a1:1
+
+
+import Foundation
+
+// DiffOracle exposes a single public function, relate(_:with:), which checks that
+// every frame of an optimized Dumpling dump has a matching frame in the unoptimized one.
+public final class DiffOracle {
+    // Execution tier named by a frame header.
+    private enum FrameType {
+        case interpreter
+        case sparkplug
+        case maglev
+        case turbofan
+        case deoptTurbofan
+    }
+
+    // A fully expanded frame: values omitted by the incremental dump format
+    // have already been filled in from the preceding frame.
+    private struct Frame: Equatable {
+        let bytecodeOffset: Int
+        let accumulator: String
+        let arguments: [String]
+        let registers: [String]
+        let functionId: Int
+        let frameType: FrameType
+
+        // Returns true if this (optimized) frame agrees with 'reference', the
+        // frame from the unoptimized run. Bytecode offset, function id and the
+        // argument/register counts must be equal. Each optimized value must be
+        // either "<optimized_out>" or equal to the corresponding reference
+        // value. The frame type is not compared.
+        func matches(reference: Frame) -> Bool {
+            guard bytecodeOffset == reference.bytecodeOffset,
+                functionId == reference.functionId,
+                arguments.count == reference.arguments.count,
+                registers.count == reference.registers.count else {
+                return false
+            }
+
+            func isMatch(_ optValue: String, unoptValue: String) -> Bool {
+                return optValue == "<optimized_out>" || optValue == unoptValue
+            }
+
+            return isMatch(accumulator, unoptValue: reference.accumulator)
+                && zip(arguments, reference.arguments).allSatisfy { isMatch($0, unoptValue: $1) }
+                && zip(registers, reference.registers).allSatisfy { isMatch($0, unoptValue: $1) }
+        }
+    }
+
+    // Parses one frame dump ('frameArr': the header line followed by value
+    // lines) into a full Frame. Everything the dump omits is inherited from
+    // 'prevFrame'. Lines are expected in the order b, f, x, n, m, a*, r*;
+    // lines that do not fit this order are left unread.
+    // Malformed input (unknown header, non-numeric field, slot index outside
+    // the frame) terminates the process with a descriptive message.
+    private static func parseDiffFrame(_ frameArr: ArraySlice<Substring>, _ prevFrame: Frame?) -> Frame {
+        // Consumes the line at 'index' if it starts with 'prefix'; otherwise
+        // leaves 'index' alone and returns 'defaultValue'.
+        func parseValue<T>(prefix: String, defaultValue: T, index: inout Int, conversion: (Substring) -> T) -> T {
+            guard index < frameArr.endIndex, frameArr[index].starts(with: prefix) else { return defaultValue }
+            defer { index += 1 }
+            return conversion(frameArr[index].dropFirst(prefix.count))
+        }
+
+        func parseInt(_ text: Substring) -> Int {
+            guard let number = Int(text) else { fatalError("Invalid number in frame dump: \(text)") }
+            return number
+        }
+
+        func parseFrameType(_ type: Substring) -> FrameType {
+            switch type {
+                case "---I": .interpreter
+                case "---S": .sparkplug
+                case "---M": .maglev
+                case "---T": .turbofan
+                case "---D": .deoptTurbofan
+                default: fatalError("Unknown frame type: \(type)")
+            }
+        }
+
+        var i = frameArr.startIndex
+        let frameType = parseFrameType(frameArr[i])
+        i += 1
+
+        let bytecodeOffset = parseValue(prefix: "b:", defaultValue: prevFrame?.bytecodeOffset ?? -1, index: &i, conversion: parseInt)
+        let functionId = parseValue(prefix: "f:", defaultValue: prevFrame?.functionId ?? -1, index: &i, conversion: parseInt)
+        let accumulator = parseValue(prefix: "x:", defaultValue: prevFrame?.accumulator ?? "", index: &i) { String($0) }
+        // A first frame without explicit counts has no argument/register slots.
+        let argCount = parseValue(prefix: "n:", defaultValue: prevFrame?.arguments.count ?? 0, index: &i, conversion: parseInt)
+        let regCount = parseValue(prefix: "m:", defaultValue: prevFrame?.registers.count ?? 0, index: &i, conversion: parseInt)
+
+        // Resizes 'oldValues' to 'totalCount' slots (new slots hold "<missing>")
+        // and applies the consecutive '<prefix><index>:<value>' lines at 'i'.
+        func updateValues(prefix: String, totalCount: Int, oldValues: [String]) -> [String] {
+            // A negative count cannot size an array, so clamp it to zero.
+            let count = max(totalCount, 0)
+            var newValues = Array(oldValues.prefix(count))
+            newValues += Array(repeating: "<missing>", count: count - newValues.count)
+
+            while i < frameArr.endIndex && frameArr[i].starts(with: prefix) {
+                // Keep empty subsequences so that a line such as "a0:" parses
+                // as an empty value instead of a one-element array.
+                let data = frameArr[i].dropFirst(prefix.count)
+                    .split(separator: ":", maxSplits: 1, omittingEmptySubsequences: false)
+                let number = parseInt(data[0])
+                precondition(newValues.indices.contains(number), "Slot index out of range in frame dump: \(frameArr[i])")
+                newValues[number] = data.count > 1 ? String(data[1]) : ""
+                i += 1
+            }
+            return newValues
+        }
+
+        let arguments = updateValues(prefix: "a", totalCount: argCount, oldValues: prevFrame?.arguments ?? [])
+        let registers = updateValues(prefix: "r", totalCount: regCount, oldValues: prevFrame?.registers ?? [])
+
+        return Frame(bytecodeOffset: bytecodeOffset, accumulator: accumulator,
+                     arguments: arguments, registers: registers,
+                     functionId: functionId, frameType: frameType)
+    }
+
+    // Splits a dump into frame dumps, which are separated by empty lines, and
+    // expands each one against the frame parsed before it.
+    private static func parseFullFrames(_ stdout: String) -> [Frame] {
+        var frameArray: [Frame] = []
+        let lines = stdout.split(separator: "\n", omittingEmptySubsequences: false)
+
+        for frame in lines.split(separator: "") {
+            assert(frame.first?.starts(with: "---") == true, "Invalid frame header found: \(frame.first ?? "nil")")
+            frameArray.append(parseDiffFrame(frame, frameArray.last))
+        }
+        return frameArray
+    }
+
+    // Returns true if every frame of 'optIn' (dump of the optimized run) is
+    // matched by a frame of 'unoptIn' (dump of the unoptimized run), with the
+    // matches occurring in order; unoptimized frames in between may be
+    // skipped. On the first optimized frame without a match, prints that frame
+    // and all unoptimized frames at the same bytecode offset, then returns false.
+    public static func relate(_ optIn: String, with unoptIn: String) -> Bool {
+        let optFrames = parseFullFrames(optIn)
+        let unoptFrames = parseFullFrames(unoptIn)
+        var unoptFramesLeft = ArraySlice(unoptFrames)
+
+        for optFrame in optFrames {
+            guard let unoptIndex = unoptFramesLeft.firstIndex(where: optFrame.matches) else {
+                print(optFrame as AnyObject)
+                print("--------------------------")
+                print("[")
+                for unoptFrame in unoptFrames where unoptFrame.bytecodeOffset == optFrame.bytecodeOffset {
+                    print(unoptFrame as AnyObject)
+                }
+                print("]")
+                return false
+            }
+            // Remove all skipped frames and the found frame.
+            unoptFramesLeft = unoptFramesLeft[(unoptIndex + 1)...]
+        }
+        return true
+    }
+}
diff --git a/Sources/RelateTool/main.swift b/Sources/RelateTool/main.swift
@@ -0,0 +1,114 @@
+// Copyright 2026 Google LLC
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+// https://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+import Foundation
+import Fuzzilli
+
+/// Command-line flag sets for the two d8 runs whose dumps are compared.
+///
+/// Every run receives `commonArgs` followed by one of the other two sets.
+public struct V8DifferentialConfig {
+    /// Flags shared by both runs.
+    public static let commonArgs: [String] = [
+        "--expose-gc", "--omit-quit",
+        "--allow-natives-for-differential-fuzzing",
+        "--fuzzing", "--future",
+        "--harmony", "--predictable",
+        "--trace", "--print-bytecode",
+        "--correctness-fuzzer-suppressions",
+        "--no-lazy-feedback-allocation",
+    ]
+
+    /// Flags added for the run whose dump is passed to `DiffOracle.relate`
+    /// as the optimized output.
+    public static let differentialArgs: [String] = [
+        "--no-sparkplug", "--jit-fuzzing",
+        "--maglev-dumping", "--turbofan-dumping",
+        "--turbofan-dumping-print-deopt-frames",
+    ]
+
+    /// Flags added for the run whose dump is passed to `DiffOracle.relate`
+    /// as the unoptimized (reference) output.
+    public static let referenceArgs: [String] = [
+        "--no-turbofan", "--no-maglev",
+        "--sparkplug-dumping", "--interpreter-dumping",
+    ]
+}
+
+/// Runs the PoC under d8 in an optimized and a reference configuration and compares the dumps.
+struct Relater {
+    let d8Path: String        // d8 binary to execute
+    let pocPath: String       // script passed to d8 as the last argument
+    let dumpFilePath: String  // file deleted before and read after every d8 run
+
+    /// Runs d8 with `args` followed by the PoC path and blocks until it exits.
+    private func runV8(args: [String]) throws {
+        let process = Process()
+        process.executableURL = URL(fileURLWithPath: d8Path)
+        process.arguments = args + [pocPath]
+        // d8's output is not needed. Send it to the null device: an undrained Pipe
+        // blocks the child once the pipe buffer fills, and waitUntilExit() never returns.
+        process.standardOutput = FileHandle.nullDevice
+        process.standardError = FileHandle.nullDevice
+        try process.run()
+        process.waitUntilExit()
+    }
+
+    /// Returns the dump file contents decoded as UTF-8.
+    private func readDumpFile() throws -> String {
+        return try String(contentsOfFile: dumpFilePath, encoding: .utf8)
+    }
+
+    /// Deletes the dump file; errors (e.g. the file does not exist yet) are ignored.
+    private func cleanDumpFile() {
+        try? FileManager.default.removeItem(atPath: dumpFilePath)
+    }
+
+    /// Produces the dump for one d8 configuration, starting from a deleted dump file.
+    private func collectDump(extraArgs: [String]) throws -> String {
+        cleanDumpFile()
+        try runV8(args: V8DifferentialConfig.commonArgs + extraArgs)
+        return try readDumpFile()
+    }
+
+    /// Main execution flow: prints the verdict and exits with status 1 on a mismatch or an error.
+    func run() {
+        do {
+            let optDumps = try collectDump(extraArgs: V8DifferentialConfig.differentialArgs)
+            let unOptDumps = try collectDump(extraArgs: V8DifferentialConfig.referenceArgs)
+            let result = DiffOracle.relate(optDumps, with: unOptDumps)
+            print("Differential check result: \(result)")
+            if !result {
+                exit(1)
+            }
+        } catch {
+            print("Error during relate: \(error)")
+            exit(1)
+        }
+    }
+}
+
+// Command-line entry point; options use the `--name=value` form.
+let args = Arguments.parse(from: CommandLine.arguments)
+
+// Both the d8 binary and the PoC script are mandatory.
+guard let jsShellPath = args["--d8"], let pocPath = args["--poc"] else {
+    print("Usage: --d8=<path_to_d8> --poc=<path_to_poc> [--dump=<path_to_dump_file>]")
+    exit(1)
+}
+
+// Optional dump file location; defaults to /tmp/output_dump.txt.
+let dumpPath = args["--dump"] ?? "/tmp/output_dump.txt"
+
+Relater(d8Path: jsShellPath, pocPath: pocPath, dumpFilePath: dumpPath).run()
diff --git a/Tests/FuzzilliTests/DiffOracleTests.swift b/Tests/FuzzilliTests/DiffOracleTests.swift