mirror of
https://github.com/oven-sh/bun
synced 2026-02-09 18:38:55 +00:00
Co-authored-by: autofix-ci[bot] <114827586+autofix-ci[bot]@users.noreply.github.com> Co-authored-by: Jarred Sumner <jarred@jarredsumner.com> Co-authored-by: Grigory <grigory.orlov.set@gmail.com> Co-authored-by: Dylan Conway <35280289+dylan-conway@users.noreply.github.com> Co-authored-by: Meghan Denny <hello@nektro.net> Co-authored-by: Kenta Iwasaki <63115601+lithdew@users.noreply.github.com> Co-authored-by: John-David Dalton <john.david.dalton@gmail.com> Co-authored-by: Dale Seo <5466341+DaleSeo@users.noreply.github.com> Co-authored-by: Zack Radisic <56137411+zackradisic@users.noreply.github.com> Co-authored-by: paperdave <paperdave@users.noreply.github.com> Co-authored-by: Georgijs Vilums <georgijs.vilums@gmail.com> Co-authored-by: Dylan Conway <dylan.conway567@gmail.com>
450 lines
15 KiB
Zig
450 lines
15 KiB
Zig
const std = @import("std");
|
|
const expect = std.testing.expect;
|
|
|
|
const bun = @import("root").bun;
|
|
|
|
const strings = bun.strings;
|
|
const js_lexer = bun.js_lexer;
|
|
|
|
const string = bun.string;
|
|
const stringZ = bun.stringZ;
|
|
const CodePoint = bun.CodePoint;
|
|
|
|
pub const MutableString = struct {
|
|
allocator: std.mem.Allocator,
|
|
list: std.ArrayListUnmanaged(u8),
|
|
|
|
pub fn init2048(allocator: std.mem.Allocator) std.mem.Allocator.Error!MutableString {
|
|
return MutableString.init(allocator, 2048);
|
|
}
|
|
|
|
pub const Writer = std.io.Writer(*@This(), anyerror, MutableString.writeAll);
|
|
pub fn writer(self: *MutableString) Writer {
|
|
return Writer{
|
|
.context = self,
|
|
};
|
|
}
|
|
|
|
pub fn isEmpty(this: *const MutableString) bool {
|
|
return this.list.items.len == 0;
|
|
}
|
|
|
|
pub fn deinit(str: *MutableString) void {
|
|
if (str.list.capacity > 0) {
|
|
str.list.expandToCapacity();
|
|
str.list.clearAndFree(str.allocator);
|
|
}
|
|
}
|
|
|
|
pub fn owns(this: *const MutableString, slice: []const u8) bool {
|
|
return bun.isSliceInBuffer(slice, this.list.items.ptr[0..this.list.capacity]);
|
|
}
|
|
|
|
pub fn growIfNeeded(self: *MutableString, amount: usize) !void {
|
|
try self.list.ensureUnusedCapacity(self.allocator, amount);
|
|
}
|
|
|
|
pub fn write(self: *MutableString, bytes: anytype) !usize {
|
|
try self.list.appendSlice(self.allocator, bytes);
|
|
return bytes.len;
|
|
}
|
|
|
|
pub fn bufferedWriter(self: *MutableString) BufferedWriter {
|
|
return BufferedWriter{ .context = self };
|
|
}
|
|
|
|
pub fn init(allocator: std.mem.Allocator, capacity: usize) std.mem.Allocator.Error!MutableString {
|
|
return MutableString{ .allocator = allocator, .list = if (capacity > 0)
|
|
try std.ArrayListUnmanaged(u8).initCapacity(allocator, capacity)
|
|
else
|
|
std.ArrayListUnmanaged(u8){} };
|
|
}
|
|
|
|
pub fn initEmpty(allocator: std.mem.Allocator) MutableString {
|
|
return MutableString{ .allocator = allocator, .list = .{} };
|
|
}
|
|
|
|
pub const ensureUnusedCapacity = growIfNeeded;
|
|
|
|
pub fn initCopy(allocator: std.mem.Allocator, str: anytype) !MutableString {
|
|
var mutable = try MutableString.init(allocator, str.len);
|
|
try mutable.copy(str);
|
|
return mutable;
|
|
}
|
|
|
|
/// Convert it to an ASCII identifier. Note: If you change this to a non-ASCII
|
|
/// identifier, you're going to potentially cause trouble with non-BMP code
|
|
/// points in target environments that don't support bracketed Unicode escapes.
|
|
pub fn ensureValidIdentifier(str: string, allocator: std.mem.Allocator) !string {
|
|
if (str.len == 0) {
|
|
return "_";
|
|
}
|
|
|
|
var iterator = strings.CodepointIterator.init(str);
|
|
var cursor = strings.CodepointIterator.Cursor{};
|
|
|
|
var has_needed_gap = false;
|
|
var needs_gap = false;
|
|
var start_i: usize = 0;
|
|
|
|
if (!iterator.next(&cursor)) return "_";
|
|
|
|
const JSLexerTables = @import("./js_lexer_tables.zig");
|
|
|
|
// Common case: no gap necessary. No allocation necessary.
|
|
needs_gap = !js_lexer.isIdentifierStart(cursor.c);
|
|
if (!needs_gap) {
|
|
// Are there any non-alphanumeric chars at all?
|
|
while (iterator.next(&cursor)) {
|
|
if (!js_lexer.isIdentifierContinue(cursor.c) or cursor.width > 1) {
|
|
needs_gap = true;
|
|
start_i = cursor.i;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (!needs_gap) {
|
|
return JSLexerTables.StrictModeReservedWordsRemap.get(str) orelse str;
|
|
}
|
|
|
|
if (needs_gap) {
|
|
var mutable = try MutableString.initCopy(allocator, if (start_i == 0)
|
|
// the first letter can be a non-identifier start
|
|
// https://github.com/oven-sh/bun/issues/2946
|
|
"_"
|
|
else
|
|
str[0..start_i]);
|
|
needs_gap = false;
|
|
|
|
var slice = str[start_i..];
|
|
iterator = strings.CodepointIterator.init(slice);
|
|
cursor = strings.CodepointIterator.Cursor{};
|
|
|
|
while (iterator.next(&cursor)) {
|
|
if (js_lexer.isIdentifierContinue(cursor.c) and cursor.width == 1) {
|
|
if (needs_gap) {
|
|
try mutable.appendChar('_');
|
|
needs_gap = false;
|
|
has_needed_gap = true;
|
|
}
|
|
try mutable.append(slice[cursor.i .. cursor.i + @as(u32, cursor.width)]);
|
|
} else if (!needs_gap) {
|
|
needs_gap = true;
|
|
// skip the code point, replace it with a single _
|
|
}
|
|
}
|
|
|
|
// If it ends with an emoji
|
|
if (needs_gap) {
|
|
try mutable.appendChar('_');
|
|
needs_gap = false;
|
|
has_needed_gap = true;
|
|
}
|
|
|
|
if (comptime bun.Environment.allow_assert) {
|
|
bun.assert(js_lexer.isIdentifier(mutable.list.items));
|
|
}
|
|
|
|
return try mutable.list.toOwnedSlice(allocator);
|
|
}
|
|
|
|
return str;
|
|
}
|
|
|
|
pub fn len(self: *const MutableString) usize {
|
|
return self.list.items.len;
|
|
}
|
|
|
|
pub fn copy(self: *MutableString, str: anytype) !void {
|
|
try self.list.ensureTotalCapacity(self.allocator, str[0..].len);
|
|
|
|
if (self.list.items.len == 0) {
|
|
try self.list.insertSlice(self.allocator, 0, str);
|
|
} else {
|
|
try self.list.replaceRange(self.allocator, 0, str[0..].len, str[0..]);
|
|
}
|
|
}
|
|
|
|
pub inline fn growBy(self: *MutableString, amount: usize) !void {
|
|
try self.list.ensureUnusedCapacity(self.allocator, amount);
|
|
}
|
|
|
|
pub inline fn appendSlice(self: *MutableString, slice: []const u8) !void {
|
|
try self.list.appendSlice(self.allocator, slice);
|
|
}
|
|
|
|
pub inline fn appendSliceExact(self: *MutableString, slice: []const u8) !void {
|
|
if (slice.len == 0) return;
|
|
|
|
try self.list.ensureTotalCapacityPrecise(self.allocator, self.list.items.len + slice.len);
|
|
var end = self.list.items.ptr + self.list.items.len;
|
|
self.list.items.len += slice.len;
|
|
@memcpy(end[0..slice.len], slice);
|
|
}
|
|
|
|
pub inline fn reset(
|
|
self: *MutableString,
|
|
) void {
|
|
self.list.clearRetainingCapacity();
|
|
}
|
|
|
|
pub inline fn resetTo(
|
|
self: *MutableString,
|
|
index: usize,
|
|
) void {
|
|
bun.assert(index <= self.list.capacity);
|
|
self.list.items.len = index;
|
|
}
|
|
|
|
pub fn inflate(self: *MutableString, amount: usize) !void {
|
|
try self.list.resize(self.allocator, amount);
|
|
}
|
|
|
|
pub inline fn appendChar(self: *MutableString, char: u8) !void {
|
|
try self.list.append(self.allocator, char);
|
|
}
|
|
pub inline fn appendCharAssumeCapacity(self: *MutableString, char: u8) void {
|
|
self.list.appendAssumeCapacity(char);
|
|
}
|
|
pub inline fn append(self: *MutableString, char: []const u8) !void {
|
|
try self.list.appendSlice(self.allocator, char);
|
|
}
|
|
pub inline fn appendInt(self: *MutableString, int: u64) !void {
|
|
const count = bun.fmt.fastDigitCount(int);
|
|
try self.list.ensureUnusedCapacity(self.allocator, count);
|
|
const old = self.list.items.len;
|
|
self.list.items.len += count;
|
|
bun.assert(count == bun.fmt.formatIntBuf(self.list.items.ptr[old .. old + count], int, 10, .lower, .{}));
|
|
}
|
|
|
|
pub inline fn appendAssumeCapacity(self: *MutableString, char: []const u8) void {
|
|
self.list.appendSliceAssumeCapacity(
|
|
char,
|
|
);
|
|
}
|
|
pub inline fn lenI(self: *MutableString) i32 {
|
|
return @as(i32, @intCast(self.list.items.len));
|
|
}
|
|
|
|
pub fn toOwnedSlice(self: *MutableString) string {
|
|
return self.list.toOwnedSlice(self.allocator) catch bun.outOfMemory(); // TODO
|
|
}
|
|
|
|
pub fn toOwnedSliceLeaky(self: *MutableString) []u8 {
|
|
return self.list.items;
|
|
}
|
|
|
|
/// Clear the existing value without freeing the memory or shrinking the capacity.
|
|
pub fn move(self: *MutableString) []u8 {
|
|
const out = self.list.items;
|
|
self.list = .{};
|
|
return out;
|
|
}
|
|
|
|
pub fn toOwnedSentinelLeaky(self: *MutableString) [:0]u8 {
|
|
if (self.list.items.len > 0 and self.list.items[self.list.items.len - 1] != 0) {
|
|
self.list.append(
|
|
self.allocator,
|
|
0,
|
|
) catch unreachable;
|
|
}
|
|
|
|
return self.list.items[0 .. self.list.items.len - 1 :0];
|
|
}
|
|
|
|
pub fn toOwnedSliceLength(self: *MutableString, length: usize) string {
|
|
self.list.shrinkAndFree(self.allocator, length);
|
|
return self.list.toOwnedSlice(self.allocator) catch bun.outOfMemory(); // TODO
|
|
}
|
|
|
|
// pub fn deleteAt(self: *MutableString, i: usize) {
|
|
// self.list.swapRemove(i);
|
|
// }
|
|
|
|
pub fn containsChar(self: *const MutableString, char: u8) bool {
|
|
return self.indexOfChar(char) != null;
|
|
}
|
|
|
|
pub fn indexOfChar(self: *const MutableString, char: u8) ?u32 {
|
|
return strings.indexOfChar(self.list.items, char);
|
|
}
|
|
|
|
pub fn lastIndexOfChar(self: *const MutableString, char: u8) ?usize {
|
|
return strings.lastIndexOfChar(self.list.items, char);
|
|
}
|
|
|
|
pub fn lastIndexOf(self: *const MutableString, str: u8) ?usize {
|
|
return strings.lastIndexOfChar(self.list.items, str);
|
|
}
|
|
|
|
pub fn indexOf(self: *const MutableString, str: u8) ?usize {
|
|
return std.mem.indexOf(u8, self.list.items, str);
|
|
}
|
|
|
|
pub fn eql(self: *MutableString, other: anytype) bool {
|
|
return std.mem.eql(u8, self.list.items, other);
|
|
}
|
|
|
|
pub fn toSocketBuffers(self: *MutableString, comptime count: usize, ranges: anytype) [count]std.posix.iovec_const {
|
|
var buffers: [count]std.posix.iovec_const = undefined;
|
|
inline for (&buffers, ranges) |*b, r| {
|
|
b.* = .{
|
|
.iov_base = self.list.items[r[0]..r[1]].ptr,
|
|
.iov_len = self.list.items[r[0]..r[1]].len,
|
|
};
|
|
}
|
|
return buffers;
|
|
}
|
|
|
|
pub const BufferedWriter = struct {
|
|
context: *MutableString,
|
|
buffer: [max]u8 = undefined,
|
|
pos: usize = 0,
|
|
|
|
const max = 2048;
|
|
|
|
pub const Writer = std.io.Writer(*BufferedWriter, anyerror, BufferedWriter.writeAll);
|
|
|
|
inline fn remain(this: *BufferedWriter) []u8 {
|
|
return this.buffer[this.pos..];
|
|
}
|
|
|
|
pub fn flush(this: *BufferedWriter) !void {
|
|
_ = try this.context.writeAll(this.buffer[0..this.pos]);
|
|
this.pos = 0;
|
|
}
|
|
|
|
pub fn writeAll(this: *BufferedWriter, bytes: []const u8) anyerror!usize {
|
|
const pending = bytes;
|
|
|
|
if (pending.len >= max) {
|
|
try this.flush();
|
|
try this.context.append(pending);
|
|
return pending.len;
|
|
}
|
|
|
|
if (pending.len > 0) {
|
|
if (pending.len + this.pos > max) {
|
|
try this.flush();
|
|
}
|
|
@memcpy(this.remain()[0..pending.len], pending);
|
|
this.pos += pending.len;
|
|
}
|
|
|
|
return pending.len;
|
|
}
|
|
|
|
const E = bun.JSAst.E;
|
|
|
|
/// Write a E.String to the buffer.
|
|
/// This automatically encodes UTF-16 into UTF-8 using
|
|
/// the same code path as TextEncoder
|
|
pub fn writeString(this: *BufferedWriter, bytes: *E.String) anyerror!usize {
|
|
if (bytes.isUTF8()) {
|
|
return try this.writeAll(bytes.slice(this.context.allocator));
|
|
}
|
|
|
|
return try this.writeAll16(bytes.slice16());
|
|
}
|
|
|
|
/// Write a UTF-16 string to the (UTF-8) buffer
|
|
/// This automatically encodes UTF-16 into UTF-8 using
|
|
/// the same code path as TextEncoder
|
|
pub fn writeAll16(this: *BufferedWriter, bytes: []const u16) anyerror!usize {
|
|
const pending = bytes;
|
|
|
|
if (pending.len >= max) {
|
|
try this.flush();
|
|
try this.context.list.ensureUnusedCapacity(this.context.allocator, bytes.len * 2);
|
|
const decoded = strings.copyUTF16IntoUTF8(
|
|
this.remain()[0 .. bytes.len * 2],
|
|
[]const u16,
|
|
bytes,
|
|
true,
|
|
);
|
|
this.context.list.items.len += @as(usize, decoded.written);
|
|
return pending.len;
|
|
}
|
|
|
|
if (pending.len > 0) {
|
|
if ((pending.len * 2) + this.pos > max) {
|
|
try this.flush();
|
|
}
|
|
const decoded = strings.copyUTF16IntoUTF8(
|
|
this.remain()[0 .. bytes.len * 2],
|
|
[]const u16,
|
|
bytes,
|
|
true,
|
|
);
|
|
this.pos += @as(usize, decoded.written);
|
|
}
|
|
|
|
return pending.len;
|
|
}
|
|
|
|
pub fn writeHTMLAttributeValueString(this: *BufferedWriter, str: *E.String) anyerror!void {
|
|
if (str.isUTF8()) {
|
|
try this.writeHTMLAttributeValue(str.slice(this.context.allocator));
|
|
return;
|
|
}
|
|
|
|
try this.writeHTMLAttributeValue16(str.slice16());
|
|
}
|
|
|
|
pub fn writeHTMLAttributeValue(this: *BufferedWriter, bytes: []const u8) anyerror!void {
|
|
var slice = bytes;
|
|
while (slice.len > 0) {
|
|
// TODO: SIMD
|
|
if (strings.indexOfAny(slice, "\"<>")) |j| {
|
|
_ = try this.writeAll(slice[0..j]);
|
|
_ = switch (slice[j]) {
|
|
'"' => try this.writeAll("""),
|
|
'<' => try this.writeAll("<"),
|
|
'>' => try this.writeAll(">"),
|
|
else => unreachable,
|
|
};
|
|
|
|
slice = slice[j + 1 ..];
|
|
continue;
|
|
}
|
|
|
|
_ = try this.writeAll(slice);
|
|
break;
|
|
}
|
|
}
|
|
|
|
pub fn writeHTMLAttributeValue16(this: *BufferedWriter, bytes: []const u16) anyerror!void {
|
|
var slice = bytes;
|
|
while (slice.len > 0) {
|
|
if (strings.indexOfAny16(slice, "\"<>")) |j| {
|
|
// this won't handle strings larger than 4 GB
|
|
// that's fine though, 4 GB of SSR'd HTML is quite a lot...
|
|
_ = try this.writeAll16(slice[0..j]);
|
|
_ = switch (slice[j]) {
|
|
'"' => try this.writeAll("""),
|
|
'<' => try this.writeAll("<"),
|
|
'>' => try this.writeAll(">"),
|
|
else => unreachable,
|
|
};
|
|
|
|
slice = slice[j + 1 ..];
|
|
continue;
|
|
}
|
|
|
|
_ = try this.writeAll16(slice);
|
|
break;
|
|
}
|
|
}
|
|
|
|
pub fn writer(this: *BufferedWriter) BufferedWriter.Writer {
|
|
return BufferedWriter.Writer{ .context = this };
|
|
}
|
|
};
|
|
|
|
pub fn writeAll(self: *MutableString, bytes: string) std.mem.Allocator.Error!usize {
|
|
try self.list.appendSlice(self.allocator, bytes);
|
|
return bytes.len;
|
|
}
|
|
};
|