Move Net stuff to clean network module

2026-03-22 04:34:44 +00:00 · 2026-02-24 02:50:03 +00:00
parent a041162b32
commit 5fea1df42b
7 changed files with 1493 additions and 1408 deletions
--- a/src/http/Http.zig
+++ b/src/http/Http.zig
@@ -17,19 +17,24 @@
 // along with this program.  If not, see <https://www.gnu.org/licenses/>.

 const std = @import("std");
+const Net = @import("../Net.zig");

-pub const c = @cImport({
-    @cInclude("curl/curl.h");
-});
+pub const c = Net.c;

-pub const ENABLE_DEBUG = false;
+pub const ENABLE_DEBUG = Net.ENABLE_DEBUG;
 pub const Client = @import("Client.zig");
 pub const Transfer = Client.Transfer;

-const lp = @import("lightpanda");
+pub const Method = Net.Method;
+pub const Header = Net.Header;
+pub const Headers = Net.Headers;
+
+pub const Connection = Net.Connection;
+
+pub const errorCheck = Net.errorCheck;
+pub const errorMCheck = Net.errorMCheck;
+
 const Config = @import("../Config.zig");
-const log = @import("../log.zig");
-const errors = @import("errors.zig");
 const RobotStore = @import("../browser/Robots.zig").RobotStore;

 const Allocator = std.mem.Allocator;
@@ -49,8 +54,8 @@ ca_blob: ?c.curl_blob,
 robot_store: *RobotStore,

 pub fn init(allocator: Allocator, robot_store: *RobotStore, config: *const Config) !Http {
-    try errorCheck(c.curl_global_init(c.CURL_GLOBAL_SSL));
-    errdefer c.curl_global_cleanup();
+    try Net.globalInit();
+    errdefer Net.globalDeinit();

    if (comptime ENABLE_DEBUG) {
        std.debug.print("curl version: {s}\n\n", .{c.curl_version()});
@@ -61,7 +66,7 @@ pub fn init(allocator: Allocator, robot_store: *RobotStore, config: *const Confi

    var ca_blob: ?c.curl_blob = null;
    if (config.tlsVerifyHost()) {
-        ca_blob = try loadCerts(allocator);
+        ca_blob = try Net.loadCerts(allocator);
    }

    return .{
@@ -78,7 +83,7 @@ pub fn deinit(self: *Http) void {
        const data: [*]u8 = @ptrCast(ca_blob.data);
        self.allocator.free(data[0..ca_blob.len]);
    }
-    c.curl_global_cleanup();
+    Net.globalDeinit();
    self.arena.deinit();
 }

@@ -89,348 +94,3 @@ pub fn createClient(self: *Http, allocator: Allocator) !*Client {
 pub fn newConnection(self: *Http) !Connection {
    return Connection.init(self.ca_blob, self.config);
 }
-
-pub const Connection = struct {
-    easy: *c.CURL,
-    http_headers: *const Config.HttpHeaders,
-
-    pub fn init(
-        ca_blob_: ?c.curl_blob,
-        config: *const Config,
-    ) !Connection {
-        const easy = c.curl_easy_init() orelse return error.FailedToInitializeEasy;
-        errdefer _ = c.curl_easy_cleanup(easy);
-
-        // timeouts
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_TIMEOUT_MS, @as(c_long, @intCast(config.httpTimeout()))));
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_CONNECTTIMEOUT_MS, @as(c_long, @intCast(config.httpConnectTimeout()))));
-
-        // redirect behavior
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_MAXREDIRS, @as(c_long, @intCast(config.httpMaxRedirects()))));
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_FOLLOWLOCATION, @as(c_long, 2)));
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_REDIR_PROTOCOLS_STR, "HTTP,HTTPS")); // remove FTP and FTPS from the default
-
-        // proxy
-        const http_proxy = config.httpProxy();
-        if (http_proxy) |proxy| {
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_PROXY, proxy.ptr));
-        }
-
-        // tls
-        if (ca_blob_) |ca_blob| {
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_CAINFO_BLOB, ca_blob));
-            if (http_proxy != null) {
-                // Note, this can be difference for the proxy and for the main
-                // request. Might be something worth exposting as command
-                // line arguments at some point.
-                try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_PROXY_CAINFO_BLOB, ca_blob));
-            }
-        } else {
-            lp.assert(config.tlsVerifyHost() == false, "Http.init tls_verify_host", .{});
-
-            // Verify peer checks that the cert is signed by a CA, verify host makes sure the
-            // cert contains the server name.
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_SSL_VERIFYHOST, @as(c_long, 0)));
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_SSL_VERIFYPEER, @as(c_long, 0)));
-
-            if (http_proxy != null) {
-                // Note, this can be difference for the proxy and for the main
-                // request. Might be something worth exposting as command
-                // line arguments at some point.
-                try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_PROXY_SSL_VERIFYHOST, @as(c_long, 0)));
-                try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_PROXY_SSL_VERIFYPEER, @as(c_long, 0)));
-            }
-        }
-
-        // compression, don't remove this. CloudFront will send gzip content
-        // even if we don't support it, and then it won't be decompressed.
-        // empty string means: use whatever's available
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_ACCEPT_ENCODING, ""));
-
-        // debug
-        if (comptime Http.ENABLE_DEBUG) {
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_VERBOSE, @as(c_long, 1)));
-
-            // Sometimes the default debug output hides some useful data. You can
-            // uncomment the following line (BUT KEEP THE LIVE ABOVE AS-IS), to
-            // get more control over the data (specifically, the `CURLINFO_TEXT`
-            // can include useful data).
-
-            // try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_DEBUGFUNCTION, debugCallback));
-        }
-
-        return .{
-            .easy = easy,
-            .http_headers = &config.http_headers,
-        };
-    }
-
-    pub fn deinit(self: *const Connection) void {
-        c.curl_easy_cleanup(self.easy);
-    }
-
-    pub fn setURL(self: *const Connection, url: [:0]const u8) !void {
-        try errorCheck(c.curl_easy_setopt(self.easy, c.CURLOPT_URL, url.ptr));
-    }
-
-    // a libcurl request has 2 methods. The first is the method that
-    // controls how libcurl behaves. This specifically influences how redirects
-    // are handled. For example, if you do a POST and get a 301, libcurl will
-    // change that to a GET. But if you do a POST and get a 308, libcurl will
-    // keep the POST (and re-send the body).
-    // The second method is the actual string that's included in the request
-    // headers.
-    // These two methods can be different - you can tell curl to behave as though
-    // you made a GET, but include "POST" in the request header.
-    //
-    // Here, we're only concerned about the 2nd method. If we want, we'll set
-    // the first one based on whether or not we have a body.
-    //
-    // It's important that, for each use of this connection, we set the 2nd
-    // method. Else, if we make a HEAD request and re-use the connection, but
-    // DON'T reset this, it'll keep making HEAD requests.
-    // (I don't know if it's as important to reset the 1st method, or if libcurl
-    // can infer that based on the presence of the body, but we also reset it
-    // to be safe);
-    pub fn setMethod(self: *const Connection, method: Method) !void {
-        const easy = self.easy;
-        const m: [:0]const u8 = switch (method) {
-            .GET => "GET",
-            .POST => "POST",
-            .PUT => "PUT",
-            .DELETE => "DELETE",
-            .HEAD => "HEAD",
-            .OPTIONS => "OPTIONS",
-            .PATCH => "PATCH",
-            .PROPFIND => "PROPFIND",
-        };
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_CUSTOMREQUEST, m.ptr));
-    }
-
-    pub fn setBody(self: *const Connection, body: []const u8) !void {
-        const easy = self.easy;
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_HTTPPOST, @as(c_long, 1)));
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_POSTFIELDSIZE, @as(c_long, @intCast(body.len))));
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_COPYPOSTFIELDS, body.ptr));
-    }
-
-    // These are headers that may not be send to the users for inteception.
-    pub fn secretHeaders(self: *const Connection, headers: *Headers) !void {
-        if (self.http_headers.proxy_bearer_header) |hdr| {
-            try headers.add(hdr);
-        }
-    }
-
-    pub fn request(self: *const Connection) !u16 {
-        const easy = self.easy;
-
-        var header_list = try Headers.init(self.http_headers.user_agent_header);
-        defer header_list.deinit();
-        try self.secretHeaders(&header_list);
-        try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_HTTPHEADER, header_list.headers));
-
-        // Add cookies.
-        if (header_list.cookies) |cookies| {
-            try errorCheck(c.curl_easy_setopt(easy, c.CURLOPT_COOKIE, cookies));
-        }
-
-        try errorCheck(c.curl_easy_perform(easy));
-        var http_code: c_long = undefined;
-        try errorCheck(c.curl_easy_getinfo(easy, c.CURLINFO_RESPONSE_CODE, &http_code));
-        if (http_code < 0 or http_code > std.math.maxInt(u16)) {
-            return 0;
-        }
-        return @intCast(http_code);
-    }
-};
-
-pub const Header = struct {
-    name: []const u8,
-    value: []const u8,
-};
-
-pub const Headers = struct {
-    headers: ?*c.curl_slist,
-    cookies: ?[*c]const u8,
-
-    pub fn init(user_agent: [:0]const u8) !Headers {
-        const header_list = c.curl_slist_append(null, user_agent);
-        if (header_list == null) {
-            return error.OutOfMemory;
-        }
-        return .{ .headers = header_list, .cookies = null };
-    }
-
-    pub fn deinit(self: *const Headers) void {
-        if (self.headers) |hdr| {
-            c.curl_slist_free_all(hdr);
-        }
-    }
-
-    pub fn add(self: *Headers, header: [*c]const u8) !void {
-        // Copies the value
-        const updated_headers = c.curl_slist_append(self.headers, header);
-        if (updated_headers == null) return error.OutOfMemory;
-        self.headers = updated_headers;
-    }
-
-    pub fn parseHeader(header_str: []const u8) ?Header {
-        const colon_pos = std.mem.indexOfScalar(u8, header_str, ':') orelse return null;
-
-        const name = std.mem.trim(u8, header_str[0..colon_pos], " \t");
-        const value = std.mem.trim(u8, header_str[colon_pos + 1 ..], " \t");
-
-        return .{ .name = name, .value = value };
-    }
-
-    pub fn iterator(self: *Headers) Iterator {
-        return .{
-            .header = self.headers,
-            .cookies = self.cookies,
-        };
-    }
-
-    const Iterator = struct {
-        header: [*c]c.curl_slist,
-        cookies: ?[*c]const u8,
-
-        pub fn next(self: *Iterator) ?Header {
-            const h = self.header orelse {
-                const cookies = self.cookies orelse return null;
-                self.cookies = null;
-                return .{ .name = "Cookie", .value = std.mem.span(@as([*:0]const u8, cookies)) };
-            };
-
-            self.header = h.*.next;
-            return parseHeader(std.mem.span(@as([*:0]const u8, @ptrCast(h.*.data))));
-        }
-    };
-};
-
-pub fn errorCheck(code: c.CURLcode) errors.Error!void {
-    if (code == c.CURLE_OK) {
-        return;
-    }
-    return errors.fromCode(code);
-}
-
-pub fn errorMCheck(code: c.CURLMcode) errors.Multi!void {
-    if (code == c.CURLM_OK) {
-        return;
-    }
-    if (code == c.CURLM_CALL_MULTI_PERFORM) {
-        // should we can client.perform() here?
-        // or just wait until the next time we naturally call it?
-        return;
-    }
-    return errors.fromMCode(code);
-}
-
-pub const Method = enum(u8) {
-    GET = 0,
-    PUT = 1,
-    POST = 2,
-    DELETE = 3,
-    HEAD = 4,
-    OPTIONS = 5,
-    PATCH = 6,
-    PROPFIND = 7,
-};
-
-// TODO: on BSD / Linux, we could just read the PEM file directly.
-// This whole rescan + decode is really just needed for MacOS. On Linux
-// bundle.rescan does find the .pem file(s) which could be in a few different
-// places, so it's still useful, just not efficient.
-fn loadCerts(allocator: Allocator) !c.curl_blob {
-    var bundle: std.crypto.Certificate.Bundle = .{};
-    try bundle.rescan(allocator);
-    defer bundle.deinit(allocator);
-
-    const bytes = bundle.bytes.items;
-    if (bytes.len == 0) {
-        log.warn(.app, "No system certificates", .{});
-        return .{
-            .len = 0,
-            .flags = 0,
-            .data = bytes.ptr,
-        };
-    }
-
-    const encoder = std.base64.standard.Encoder;
-    var arr: std.ArrayList(u8) = .empty;
-
-    const encoded_size = encoder.calcSize(bytes.len);
-    const buffer_size = encoded_size +
-        (bundle.map.count() * 75) + // start / end per certificate + extra, just in case
-        (encoded_size / 64) // newline per 64 characters
-    ;
-    try arr.ensureTotalCapacity(allocator, buffer_size);
-    errdefer arr.deinit(allocator);
-    var writer = arr.writer(allocator);
-
-    var it = bundle.map.valueIterator();
-    while (it.next()) |index| {
-        const cert = try std.crypto.Certificate.der.Element.parse(bytes, index.*);
-
-        try writer.writeAll("-----BEGIN CERTIFICATE-----\n");
-        var line_writer = LineWriter{ .inner = writer };
-        try encoder.encodeWriter(&line_writer, bytes[index.*..cert.slice.end]);
-        try writer.writeAll("\n-----END CERTIFICATE-----\n");
-    }
-
-    // Final encoding should not be larger than our initial size estimate
-    lp.assert(buffer_size > arr.items.len, "Http loadCerts", .{ .estimate = buffer_size, .len = arr.items.len });
-
-    // Allocate exactly the size needed and copy the data
-    const result = try allocator.dupe(u8, arr.items);
-    // Free the original oversized allocation
-    arr.deinit(allocator);
-
-    return .{
-        .len = result.len,
-        .data = result.ptr,
-        .flags = 0,
-    };
-}
-
-// Wraps lines @ 64 columns. A PEM is basically a base64 encoded DER (which is
-// what Zig has), with lines wrapped at 64 characters and with a basic header
-// and footer
-const LineWriter = struct {
-    col: usize = 0,
-    inner: std.ArrayList(u8).Writer,
-
-    pub fn writeAll(self: *LineWriter, data: []const u8) !void {
-        var writer = self.inner;
-
-        var col = self.col;
-        const len = 64 - col;
-
-        var remain = data;
-        if (remain.len > len) {
-            col = 0;
-            try writer.writeAll(data[0..len]);
-            try writer.writeByte('\n');
-            remain = data[len..];
-        }
-
-        while (remain.len > 64) {
-            try writer.writeAll(remain[0..64]);
-            try writer.writeByte('\n');
-            remain = data[len..];
-        }
-        try writer.writeAll(remain);
-        self.col = col + remain.len;
-    }
-};
-
-pub fn debugCallback(_: *c.CURL, msg_type: c.curl_infotype, raw: [*c]u8, len: usize, _: *anyopaque) callconv(.c) void {
-    const data = raw[0..len];
-    switch (msg_type) {
-        c.CURLINFO_TEXT => std.debug.print("libcurl [text]: {s}\n", .{data}),
-        c.CURLINFO_HEADER_OUT => std.debug.print("libcurl [req-h]: {s}\n", .{data}),
-        c.CURLINFO_HEADER_IN => std.debug.print("libcurl [res-h]: {s}\n", .{data}),
-        // c.CURLINFO_DATA_IN => std.debug.print("libcurl [res-b]: {s}\n", .{data}),
-        else => std.debug.print("libcurl ?? {d}\n", .{msg_type}),
-    }
-}