mirror of
https://github.com/lightpanda-io/browser.git
synced 2026-03-28 15:40:04 +00:00
This commit involves a number of changes to finalizers, all aimed towards better consistency and reliability. A big part of this has to do with v8::Inspector's ability to move objects across IsolatedWorlds. There has been a few previous efforts on this, the most significant being https://github.com/lightpanda-io/browser/pull/1901. To recap, a Zig instance can map to 0-N v8::Objects. Where N is the total number of IsolatedWorlds. Generally, IsolatedWorlds between origins are...isolated...but the v8::Inspector isn't bound by this. So a Zig instance cannot be tied to a Context/Identity/IsolatedWorld...it has to live until all references, possibly from different IsolatedWorlds, are released (or the page is reset). Finalizers could previously be managed via reference counting or explicitly toggling the instance as weak/strong. Now, only reference counting is supported. weak/strong can essentially be seen as an acquireRef (rc += 1) and releaseRef (rc -= 1). Explicit setting did make some things easier, like not having to worry so much about double-releasing (e.g. XHR abort being called multiple times), but it was only used in a few places AND it simply doesn't work with objects shared between IsolatedWorlds. It is never a boolean now, as 3 different IsolatedWorlds can each hold a reference. Temps and Globals are tracked on the Session. Previously, they were tracked on the Identity, but that makes no sense. If a Zig instance can outlive an Identity, then any of its Temp references can too. This hasn't been a problem because we've only seen MutationObserver and IntersectionObserver be used cross-origin, but the right CDP script can make this crash with a use-after-free (e.g. `MessageEvent.data` is released when the Identity is done, but `MessageEvent` is still referenced by a different IsolateWorld). Rather than deinit with a `comptime shutdown: bool`, there is now an explicit `releaseRef` and `deinit`. Bridge registration has been streamlined. Previously, types had to register their finalizer AND acquireRef/releaseRef/deinit had to be declared on the entire prototype chain, even if these methods just delegated to their proto. Finalizers are now automatically enabled if a type has a `acquireRef` function. If a type has an `acquireRef`, then it must have a `releaseRef` and a `deinit`. So if there's custom cleanup to do in `deinit`, then you also have to define `acquireRef` and `releaseRef` which will just delegate to the _proto. Furthermore these finalizer methods can be defined anywhere on the chain. Previously: ```zig const KeywboardEvent = struct { _proto: *Event, ... pub fn deinit(self: *KeyboardEvent, session: *Session) void { self._proto.deinit(session); } pub fn releaseRef(self: *KeyboardEvent, session: *Session) void { self._proto.releaseRef(session); } } ``` ```zig const KeyboardEvent = struct { _proto: *Event, ... // no deinit, releaseRef, acquireref } ``` Since the `KeyboardEvent` doesn't participate in finalization directly, it doesn't have to define anything. The bridge will detect the most specific place they are defined and call them there.
246 lines
9.0 KiB
Zig
246 lines
9.0 KiB
Zig
// Copyright (C) 2023-2025 Lightpanda (Selecy SAS)
|
|
//
|
|
// Francis Bouvier <francis@lightpanda.io>
|
|
// Pierre Tachoire <pierre@lightpanda.io>
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Affero General Public License as
|
|
// published by the Free Software Foundation, either version 3 of the
|
|
// License, or (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Affero General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
// along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
const std = @import("std");
|
|
pub const App = @import("App.zig");
|
|
pub const Network = @import("network/Runtime.zig");
|
|
pub const Server = @import("Server.zig");
|
|
pub const Config = @import("Config.zig");
|
|
pub const URL = @import("browser/URL.zig");
|
|
pub const String = @import("string.zig").String;
|
|
pub const Page = @import("browser/Page.zig");
|
|
pub const Browser = @import("browser/Browser.zig");
|
|
pub const Session = @import("browser/Session.zig");
|
|
pub const Notification = @import("Notification.zig");
|
|
|
|
pub const log = @import("log.zig");
|
|
pub const js = @import("browser/js/js.zig");
|
|
pub const dump = @import("browser/dump.zig");
|
|
pub const markdown = @import("browser/markdown.zig");
|
|
pub const SemanticTree = @import("SemanticTree.zig");
|
|
pub const CDPNode = @import("cdp/Node.zig");
|
|
pub const interactive = @import("browser/interactive.zig");
|
|
pub const links = @import("browser/links.zig");
|
|
pub const forms = @import("browser/forms.zig");
|
|
pub const actions = @import("browser/actions.zig");
|
|
pub const structured_data = @import("browser/structured_data.zig");
|
|
pub const mcp = @import("mcp.zig");
|
|
pub const build_config = @import("build_config");
|
|
pub const crash_handler = @import("crash_handler.zig");
|
|
|
|
pub const HttpClient = @import("browser/HttpClient.zig");
|
|
const IS_DEBUG = @import("builtin").mode == .Debug;
|
|
|
|
pub const FetchOpts = struct {
|
|
wait_ms: u32 = 5000,
|
|
wait_until: Config.WaitUntil = .load,
|
|
dump: dump.Opts,
|
|
dump_mode: ?Config.DumpFormat = null,
|
|
writer: ?*std.Io.Writer = null,
|
|
};
|
|
pub fn fetch(app: *App, url: [:0]const u8, opts: FetchOpts) !void {
|
|
const http_client = try HttpClient.init(app.allocator, &app.network);
|
|
defer http_client.deinit();
|
|
|
|
const notification = try Notification.init(app.allocator);
|
|
defer notification.deinit();
|
|
|
|
var browser = try Browser.init(app, .{ .http_client = http_client });
|
|
defer browser.deinit();
|
|
|
|
var session = try browser.newSession(notification);
|
|
const page = try session.createPage();
|
|
|
|
// // Comment this out to get a profile of the JS code in v8/profile.json.
|
|
// // You can open this in Chrome's profiler.
|
|
// // I've seen it generate invalid JSON, but I'm not sure why. It
|
|
// // happens rarely, and I manually fix the file.
|
|
// page.js.startCpuProfiler();
|
|
// defer {
|
|
// if (page.js.stopCpuProfiler()) |profile| {
|
|
// std.fs.cwd().writeFile(.{
|
|
// .sub_path = ".lp-cache/cpu_profile.json",
|
|
// .data = profile,
|
|
// }) catch |err| {
|
|
// log.err(.app, "profile write error", .{ .err = err });
|
|
// };
|
|
// } else |err| {
|
|
// log.err(.app, "profile error", .{ .err = err });
|
|
// }
|
|
// }
|
|
|
|
// // Comment this out to get a heap V8 heap profil
|
|
// page.js.startHeapProfiler();
|
|
// defer {
|
|
// if (page.js.stopHeapProfiler()) |profile| {
|
|
// std.fs.cwd().writeFile(.{
|
|
// .sub_path = ".lp-cache/allocating.heapprofile",
|
|
// .data = profile.@"0",
|
|
// }) catch |err| {
|
|
// log.err(.app, "allocating write error", .{ .err = err });
|
|
// };
|
|
// std.fs.cwd().writeFile(.{
|
|
// .sub_path = ".lp-cache/snapshot.heapsnapshot",
|
|
// .data = profile.@"1",
|
|
// }) catch |err| {
|
|
// log.err(.app, "heapsnapshot write error", .{ .err = err });
|
|
// };
|
|
// } else |err| {
|
|
// log.err(.app, "profile error", .{ .err = err });
|
|
// }
|
|
// }
|
|
|
|
const encoded_url = try URL.ensureEncoded(page.call_arena, url);
|
|
_ = try page.navigate(encoded_url, .{
|
|
.reason = .address_bar,
|
|
.kind = .{ .push = null },
|
|
});
|
|
var runner = try session.runner(.{});
|
|
try runner.wait(.{ .ms = opts.wait_ms, .until = opts.wait_until });
|
|
|
|
const writer = opts.writer orelse return;
|
|
if (opts.dump_mode) |mode| {
|
|
switch (mode) {
|
|
.html => try dump.root(page.window._document, opts.dump, writer, page),
|
|
.markdown => try markdown.dump(page.window._document.asNode(), .{}, writer, page),
|
|
.semantic_tree, .semantic_tree_text => {
|
|
var registry = CDPNode.Registry.init(app.allocator);
|
|
defer registry.deinit();
|
|
|
|
const st: SemanticTree = .{
|
|
.dom_node = page.window._document.asNode(),
|
|
.registry = ®istry,
|
|
.page = page,
|
|
.arena = page.call_arena,
|
|
.prune = (mode == .semantic_tree_text),
|
|
};
|
|
|
|
if (mode == .semantic_tree) {
|
|
try std.json.Stringify.value(st, .{}, writer);
|
|
} else {
|
|
try st.textStringify(writer);
|
|
}
|
|
},
|
|
.wpt => try dumpWPT(page, writer),
|
|
}
|
|
}
|
|
try writer.flush();
|
|
}
|
|
|
|
fn dumpWPT(page: *Page, writer: *std.Io.Writer) !void {
|
|
var ls: js.Local.Scope = undefined;
|
|
page.js.localScope(&ls);
|
|
defer ls.deinit();
|
|
|
|
var try_catch: js.TryCatch = undefined;
|
|
try_catch.init(&ls.local);
|
|
defer try_catch.deinit();
|
|
|
|
// return the detailed result.
|
|
const dump_script =
|
|
\\ JSON.stringify((() => {
|
|
\\ const statuses = ['Pass', 'Fail', 'Timeout', 'Not Run', 'Optional Feature Unsupported'];
|
|
\\ const parse = (raw) => {
|
|
\\ for (const status of statuses) {
|
|
\\ const idx = raw.indexOf('|' + status);
|
|
\\ if (idx !== -1) {
|
|
\\ const name = raw.slice(0, idx);
|
|
\\ const rest = raw.slice(idx + status.length + 1);
|
|
\\ const message = rest.length > 0 && rest[0] === '|' ? rest.slice(1) : null;
|
|
\\ return { name, status, message };
|
|
\\ }
|
|
\\ }
|
|
\\ return { name: raw, status: 'Unknown', message: null };
|
|
\\ };
|
|
\\ const cases = Object.values(report.cases).map(parse);
|
|
\\ return {
|
|
\\ url: window.location.href,
|
|
\\ status: report.status,
|
|
\\ message: report.message,
|
|
\\ summary: {
|
|
\\ total: cases.length,
|
|
\\ passed: cases.filter(c => c.status === 'Pass').length,
|
|
\\ failed: cases.filter(c => c.status === 'Fail').length,
|
|
\\ timeout: cases.filter(c => c.status === 'Timeout').length,
|
|
\\ notrun: cases.filter(c => c.status === 'Not Run').length,
|
|
\\ unsupported: cases.filter(c => c.status === 'Optional Feature Unsupported').length
|
|
\\ },
|
|
\\ cases
|
|
\\ };
|
|
\\ })(), null, 2)
|
|
;
|
|
const value = ls.local.exec(dump_script, "dump_script") catch |err| {
|
|
const caught = try_catch.caughtOrError(page.call_arena, err);
|
|
return writer.print("Caught error trying to access WPT's report: {f}\n", .{caught});
|
|
};
|
|
try writer.writeAll("== WPT Results==\n");
|
|
try writer.writeAll(try value.toStringSliceWithAlloc(page.call_arena));
|
|
}
|
|
|
|
pub inline fn assert(ok: bool, comptime ctx: []const u8, args: anytype) void {
|
|
if (!ok) {
|
|
if (comptime IS_DEBUG) {
|
|
unreachable;
|
|
}
|
|
assertionFailure(ctx, args);
|
|
}
|
|
}
|
|
|
|
noinline fn assertionFailure(comptime ctx: []const u8, args: anytype) noreturn {
|
|
@branchHint(.cold);
|
|
if (@inComptime()) {
|
|
@compileError(std.fmt.comptimePrint("assertion failure: " ++ ctx, args));
|
|
}
|
|
@import("crash_handler.zig").crash(ctx, args, @returnAddress());
|
|
}
|
|
|
|
// Reference counting helper
|
|
pub fn RC(comptime T: type) type {
|
|
return struct {
|
|
_refs: T = 0,
|
|
|
|
pub fn init(refs: T) @This() {
|
|
return .{._refs = refs};
|
|
}
|
|
|
|
pub fn acquire(self: *@This()) void {
|
|
self._refs += 1;
|
|
}
|
|
|
|
pub fn release(self: *@This(), value: anytype, session: *Session) void {
|
|
if (comptime IS_DEBUG) {
|
|
std.debug.assert(self._refs > 0);
|
|
}
|
|
|
|
const refs = self._refs - 1;
|
|
self._refs = refs;
|
|
if (refs > 0) {
|
|
return;
|
|
}
|
|
value.deinit(session);
|
|
if (session.finalizer_callbacks.fetchRemove(@intFromPtr(value))) |kv| {
|
|
session.releaseArena(kv.value.arena);
|
|
}
|
|
}
|
|
};
|
|
}
|
|
|
|
test {
|
|
std.testing.refAllDecls(@This());
|
|
}
|