Fix ascii→ascii shortcut bypassing 0x7F masking

The `from == to` optimization copied the buffer unchanged for all same-encoding pairs, but ascii→ascii must mask each byte with & 0x7F per Node.js semantics. Exclude ASCII from the shortcut and add an explicit ascii→ascii case that copies the already-masked data. https://claude.ai/code/session_01WK9KQWWRoS7dcmZmUbUo8M
Validate UTF-8 continuation bytes before accepting multi-byte sequences
2026-02-22 08:41:46 +00:00 · 2026-02-21 06:32:42 +00:00 · 2026-02-21 06:02:31 +00:00 · 2026-02-21 05:52:31 +00:00 · 2026-02-21 05:04:21 +00:00 · 2026-02-20 04:45:22 +00:00
8 changed files with 558 additions and 128 deletions
--- a/src/bun.js/bindings/FormatStackTraceForJS.cpp
+++ b/src/bun.js/bindings/FormatStackTraceForJS.cpp
@@ -22,7 +22,6 @@
 #include "BunClientData.h"
 #include "CallSite.h"
 #include "ErrorStackTrace.h"
-#include "JSDOMException.h"
 #include "headers-handwritten.h"

 using namespace JSC;
@@ -380,9 +379,6 @@ static String computeErrorInfoWithoutPrepareStackTrace(
            RETURN_IF_EXCEPTION(scope, {});
            message = instance->sanitizedMessageString(lexicalGlobalObject);
            RETURN_IF_EXCEPTION(scope, {});
-        } else if (auto* domException = jsDynamicCast<WebCore::JSDOMException*>(errorInstance)) {
-            name = domException->wrapped().name();
-            message = domException->wrapped().message();
        }
    }

--- a/src/bun.js/bindings/webcore/JSDOMException.cpp
+++ b/src/bun.js/bindings/webcore/JSDOMException.cpp
@@ -46,10 +46,6 @@
 #include <wtf/PointerPreparations.h>
 #include <wtf/URL.h>

-#include "FormatStackTraceForJS.h"
-#include "ZigGlobalObject.h"
-#include <JavaScriptCore/Interpreter.h>
-
 namespace WebCore {
 using namespace JSC;

@@ -124,34 +120,6 @@ static const HashTableValue JSDOMExceptionConstructorTableValues[] = {
    { "DATA_CLONE_ERR"_s, JSC::PropertyAttribute::DontDelete | JSC::PropertyAttribute::ReadOnly | JSC::PropertyAttribute::ConstantInteger, NoIntrinsic, { HashTableValue::ConstantType, 25 } },
 };

-static void captureStackTraceForDOMException(JSC::VM& vm, JSC::JSGlobalObject* lexicalGlobalObject, JSC::JSObject* errorObject)
-{
-    if (!vm.topCallFrame)
-        return;
-
-    auto* zigGlobalObject = jsDynamicCast<Zig::GlobalObject*>(lexicalGlobalObject);
-    if (!zigGlobalObject)
-        zigGlobalObject = ::defaultGlobalObject(lexicalGlobalObject);
-
-    size_t stackTraceLimit = zigGlobalObject->stackTraceLimit().value();
-    if (stackTraceLimit == 0)
-        stackTraceLimit = Bun::DEFAULT_ERROR_STACK_TRACE_LIMIT;
-
-    WTF::Vector<JSC::StackFrame> stackTrace;
-    vm.interpreter.getStackTrace(errorObject, stackTrace, 0, stackTraceLimit);
-
-    if (stackTrace.isEmpty())
-        return;
-
-    unsigned int line = 0;
-    unsigned int column = 0;
-    String sourceURL;
-    JSValue result = Bun::computeErrorInfoWrapperToJSValue(vm, stackTrace, line, column, sourceURL, errorObject, nullptr);
-
-    if (result)
-        errorObject->putDirect(vm, vm.propertyNames->stack, result, 0);
-}
-
 template<> JSC::EncodedJSValue JSC_HOST_CALL_ATTRIBUTES JSDOMExceptionDOMConstructor::construct(JSGlobalObject* lexicalGlobalObject, CallFrame* callFrame)
 {
    auto& vm = JSC::getVM(lexicalGlobalObject);
@@ -394,12 +362,26 @@ void JSDOMExceptionOwner::finalize(JSC::Handle<JSC::Unknown> handle, void* conte
 // #endif
 // #endif

-JSC::JSValue toJSNewlyCreated(JSC::JSGlobalObject* lexicalGlobalObject, JSDOMGlobalObject* globalObject, Ref<DOMException>&& impl)
+JSC::JSValue toJSNewlyCreated(JSC::JSGlobalObject*, JSDOMGlobalObject* globalObject, Ref<DOMException>&& impl)
 {
-    auto* wrapper = createWrapper<DOMException>(globalObject, WTF::move(impl));
-    auto& vm = globalObject->vm();
-    captureStackTraceForDOMException(vm, lexicalGlobalObject ? lexicalGlobalObject : globalObject, wrapper);
-    return wrapper;
+
+    // if constexpr (std::is_polymorphic_v<DOMException>) {
+    // #if ENABLE(BINDING_INTEGRITY)
+    //         // const void* actualVTablePointer = getVTablePointer(impl.ptr());
+    // #if PLATFORM(WIN)
+    //         void* expectedVTablePointer = __identifier("??_7DOMException@WebCore@@6B@");
+    // #else
+    //         // void* expectedVTablePointer = &_ZTVN7WebCore12DOMExceptionE[2];
+    // #endif
+
+    //         // If you hit this assertion you either have a use after free bug, or
+    //         // DOMException has subclasses. If DOMException has subclasses that get passed
+    //         // to toJS() we currently require DOMException you to opt out of binding hardening
+    //         // by adding the SkipVTableValidation attribute to the interface IDL definition
+    //         // RELEASE_ASSERT(actualVTablePointer == expectedVTablePointer);
+    // #endif
+    // }
+    return createWrapper<DOMException>(globalObject, WTF::move(impl));
 }

 JSC::JSValue toJS(JSC::JSGlobalObject* lexicalGlobalObject, JSDOMGlobalObject* globalObject, DOMException& impl)
--- a/src/bun.js/modules/NodeBufferModule.h
+++ b/src/bun.js/modules/NodeBufferModule.h
@@ -3,6 +3,7 @@
 #include "root.h"

 #include "../bindings/JSBuffer.h"
+#include "../bindings/JSBufferEncodingType.h"
 #include "ErrorCode.h"
 #include "JavaScriptCore/PageCount.h"
 #include "NodeValidator.h"
@@ -125,6 +126,432 @@ JSC_DEFINE_HOST_FUNCTION(jsBufferConstructorFunction_isAscii,

 BUN_DECLARE_HOST_FUNCTION(jsFunctionResolveObjectURL);

+// Encodings accepted by transcode(); parseTranscodeEncoding() maps BufferEncodingType values onto these four and rejects all others.
+enum class TranscodeEncoding : uint8_t {
+    ASCII,
+    LATIN1,
+    UTF8,
+    UCS2, // UTF-16LE; selected by both the ucs2 and utf16le BufferEncodingType values
+};
+
+// Maps a JS encoding argument onto a TranscodeEncoding.
+// Yields std::nullopt when parseEnumeration<BufferEncodingType> produces no value, or when the
+// parsed encoding is anything other than ascii, latin1, utf8, ucs2 or utf16le.
+static std::optional<TranscodeEncoding> parseTranscodeEncoding(JSC::JSGlobalObject& globalObject, JSValue value)
+{
+    const auto parsed = parseEnumeration<BufferEncodingType>(globalObject, value);
+    if (!parsed)
+        return std::nullopt;
+
+    std::optional<TranscodeEncoding> mapped;
+    switch (*parsed) {
+    case BufferEncodingType::ascii:
+        mapped = TranscodeEncoding::ASCII;
+        break;
+    case BufferEncodingType::latin1:
+        mapped = TranscodeEncoding::LATIN1;
+        break;
+    case BufferEncodingType::utf8:
+        mapped = TranscodeEncoding::UTF8;
+        break;
+    case BufferEncodingType::ucs2:
+    case BufferEncodingType::utf16le:
+        // Both names select the same UTF-16LE transcoder.
+        mapped = TranscodeEncoding::UCS2;
+        break;
+    default:
+        // Every other BufferEncodingType is unsupported; leave `mapped` empty.
+        break;
+    }
+    return mapped;
+}
+
+// Returns true when every byte after the lead byte of the seqLen-byte sequence starting at
+// source[srcIdx] has the 10xxxxxx continuation pattern. The lead byte itself is not inspected.
+// The function reads source[srcIdx + 1 .. srcIdx + seqLen - 1] without any bounds check.
+static inline bool validateUtf8Continuations(const char* source, size_t srcIdx, size_t seqLen)
+{
+    const auto* sequence = reinterpret_cast<const uint8_t*>(source) + srcIdx;
+    size_t offset = 1;
+    while (offset < seqLen) {
+        const uint8_t trailing = sequence[offset];
+        if ((trailing & 0xC0) != 0x80)
+            return false;
+        ++offset;
+    }
+    return true;
+}
+
+// Counts the output bytes produced for UTF-8 input that may be malformed; used by
+// transcodeUtf8ToSingleByte() to size its buffer when the input fails validation.
+//   - a well-formed sequence counts once;
+//   - a byte that cannot start a sequence counts once;
+//   - a lead byte followed by a bad continuation byte counts once, and scanning resumes at the next byte;
+//   - a sequence cut off by the end of the input counts once per remaining byte.
+static size_t countUtf8Codepoints(const char* source, size_t sourceLength)
+{
+    size_t outputs = 0;
+    for (size_t pos = 0; pos < sourceLength;) {
+        const uint8_t lead = static_cast<uint8_t>(source[pos]);
+
+        // Sequence length announced by the lead byte; 0 marks a byte that cannot start a sequence.
+        size_t expected = 0;
+        if (lead < 0x80)
+            expected = 1;
+        else if ((lead & 0xE0) == 0xC0)
+            expected = 2;
+        else if ((lead & 0xF0) == 0xE0)
+            expected = 3;
+        else if ((lead & 0xF8) == 0xF0)
+            expected = 4;
+
+        if (expected != 0 && pos + expected > sourceLength) {
+            // Truncated tail: every remaining byte is reported individually.
+            outputs += sourceLength - pos;
+            break;
+        }
+
+        const bool wellFormed = expected == 1
+            || (expected > 1 && validateUtf8Continuations(source, pos, expected));
+
+        // Valid or not, exactly one output is produced here; only the step size differs.
+        outputs++;
+        pos += wellFormed ? expected : 1;
+    }
+    return outputs;
+}
+
+// Converts UTF-8 into an encoding that stores one byte per codepoint.
+// Codepoints up to and including `threshold` are written unchanged; larger ones become '?'.
+// Malformed input also becomes '?': one for a byte that cannot start a sequence, one for a lead
+// byte whose continuation bytes are wrong, and one per remaining byte of a truncated sequence.
+// Returns nullptr when the output buffer could not be created.
+static JSC::JSUint8Array* transcodeUtf8ToSingleByte(JSC::JSGlobalObject* globalObject, const char* source, size_t sourceLength, uint32_t threshold)
+{
+    // Valid input is sized by simdutf; otherwise use the counting pass that mirrors the loop below.
+    const size_t outputLength = simdutf::validate_utf8(source, sourceLength)
+        ? simdutf::utf32_length_from_utf8(source, sourceLength)
+        : countUtf8Codepoints(source, sourceLength);
+
+    auto* result = WebCore::createUninitializedBuffer(globalObject, outputLength);
+    if (!result)
+        return nullptr;
+
+    auto* out = result->typedVector();
+    const auto* in = reinterpret_cast<const uint8_t*>(source);
+    size_t readPos = 0;
+    size_t writePos = 0;
+    while (readPos < sourceLength && writePos < outputLength) {
+        const uint8_t lead = in[readPos];
+
+        // Single-byte (ASCII range) codepoint.
+        if (lead < 0x80) {
+            out[writePos++] = (lead <= threshold) ? lead : '?';
+            readPos++;
+            continue;
+        }
+
+        // Sequence length and payload bits carried by the lead byte.
+        size_t seqLen = 0;
+        uint32_t codepoint = 0;
+        if ((lead & 0xE0) == 0xC0) {
+            seqLen = 2;
+            codepoint = lead & 0x1F;
+        } else if ((lead & 0xF0) == 0xE0) {
+            seqLen = 3;
+            codepoint = lead & 0x0F;
+        } else if ((lead & 0xF8) == 0xF0) {
+            seqLen = 4;
+            codepoint = lead & 0x07;
+        } else {
+            // Invalid UTF-8 start byte
+            out[writePos++] = '?';
+            readPos++;
+            continue;
+        }
+
+        // Sequence runs past the end of the input: one '?' per remaining byte, then stop.
+        if (readPos + seqLen > sourceLength) {
+            while (readPos < sourceLength && writePos < outputLength) {
+                out[writePos++] = '?';
+                readPos++;
+            }
+            break;
+        }
+
+        // Bad continuation byte: only the lead byte is consumed.
+        if (!validateUtf8Continuations(source, readPos, seqLen)) {
+            out[writePos++] = '?';
+            readPos++;
+            continue;
+        }
+
+        // Each continuation byte contributes its low six bits.
+        for (size_t k = 1; k < seqLen; k++)
+            codepoint = (codepoint << 6) | (in[readPos + k] & 0x3F);
+
+        out[writePos++] = (codepoint <= threshold) ? static_cast<uint8_t>(codepoint) : '?';
+        readPos += seqLen;
+    }
+
+    return result;
+}
+
+// UTF-8 → ASCII: codepoints above 0x7F (and malformed bytes) are emitted as '?'.
+static JSC::JSUint8Array* transcodeUtf8ToAscii(JSC::JSGlobalObject* globalObject, const char* source, size_t sourceLength)
+{
+    constexpr uint32_t highestAsciiCodepoint = 0x7F;
+    return transcodeUtf8ToSingleByte(globalObject, source, sourceLength, highestAsciiCodepoint);
+}
+
+// UTF-8 → Latin-1: codepoints above 0xFF (and malformed bytes) are emitted as '?'.
+static JSC::JSUint8Array* transcodeUtf8ToLatin1(JSC::JSGlobalObject* globalObject, const char* source, size_t sourceLength)
+{
+    constexpr uint32_t highestLatin1Codepoint = 0xFF;
+    return transcodeUtf8ToSingleByte(globalObject, source, sourceLength, highestLatin1Codepoint);
+}
+
+// Transcode UCS-2 (UTF-16LE) to ASCII: each code unit > 0x7F becomes '?'.
+// `source` addresses `charLength` 16-bit code units; the output holds one byte per code unit.
+// Returns nullptr when the output buffer could not be created.
+static JSC::JSUint8Array* transcodeUcs2ToAscii(JSC::JSGlobalObject* globalObject, const char16_t* source, size_t charLength)
+{
+    auto* result = WebCore::createUninitializedBuffer(globalObject, charLength);
+    if (!result)
+        return nullptr;
+
+    // The caller obtains `source` by reinterpreting a typed-array byte pointer, which is not
+    // guaranteed to be 2-byte aligned. Assemble each code unit from its two bytes instead of
+    // dereferencing the char16_t pointer; reading the low byte first also keeps the UTF-16LE
+    // interpretation independent of host byte order.
+    const auto* bytes = reinterpret_cast<const uint8_t*>(source);
+    auto* out = result->typedVector();
+    for (size_t i = 0; i < charLength; i++) {
+        const uint16_t unit = static_cast<uint16_t>(bytes[2 * i] | (bytes[2 * i + 1] << 8));
+        out[i] = (unit <= 0x7F) ? static_cast<uint8_t>(unit) : '?';
+    }
+    return result;
+}
+
+// Transcode UCS-2 (UTF-16LE) to Latin-1: each code unit > 0xFF becomes '?'.
+// `source` addresses `charLength` 16-bit code units; the output holds one byte per code unit.
+// Returns nullptr when the output buffer could not be created.
+static JSC::JSUint8Array* transcodeUcs2ToLatin1(JSC::JSGlobalObject* globalObject, const char16_t* source, size_t charLength)
+{
+    auto* result = WebCore::createUninitializedBuffer(globalObject, charLength);
+    if (!result)
+        return nullptr;
+
+    // The caller obtains `source` by reinterpreting a typed-array byte pointer, which is not
+    // guaranteed to be 2-byte aligned. Assemble each code unit from its two bytes instead of
+    // dereferencing the char16_t pointer; reading the low byte first also keeps the UTF-16LE
+    // interpretation independent of host byte order.
+    const auto* bytes = reinterpret_cast<const uint8_t*>(source);
+    auto* out = result->typedVector();
+    for (size_t i = 0; i < charLength; i++) {
+        const uint16_t unit = static_cast<uint16_t>(bytes[2 * i] | (bytes[2 * i + 1] << 8));
+        out[i] = (unit <= 0xFF) ? static_cast<uint8_t>(unit) : '?';
+    }
+    return result;
+}
+
+// buffer.transcode(source, fromEncoding, toEncoding)
+//
+// Re-encodes the bytes of `source` from one of ascii / latin1 / utf8 / ucs2 (utf16le) into
+// another of those encodings and returns the result as a new Buffer.
+//
+// - `source` must be a Buffer or Uint8Array, otherwise an invalid-argument-type error is thrown
+//   via Bun::ERR::INVALID_ARG_TYPE_INSTANCE; a detached source throws an invalid-state error.
+// - An empty source returns an empty Buffer before the encodings are even looked at.
+// - An unsupported encoding throws "Unable to transcode Buffer [U_ILLEGAL_ARGUMENT_ERROR]".
+// - UTF-8 → UCS-2 and UCS-2 → UTF-8 throw "Unable to transcode Buffer [U_INVALID_CHAR_FOUND]"
+//   when the simdutf conversion reports zero output for non-empty input.
+JSC_DEFINE_HOST_FUNCTION(jsFunction_transcode,
+    (JSGlobalObject * globalObject,
+        CallFrame* callFrame))
+{
+    VM& vm = globalObject->vm();
+    auto scope = DECLARE_THROW_SCOPE(vm);
+
+    JSValue sourceValue = callFrame->argument(0);
+
+    // Validate source is Buffer or Uint8Array. Casting to the generic JSArrayBufferView would
+    // also let every other typed array and DataView through, contradicting the error message
+    // below and Node.js, which only accepts Uint8Array instances here.
+    auto* sourceView = JSC::jsDynamicCast<JSC::JSUint8Array*>(sourceValue);
+    if (!sourceView) {
+        Bun::ERR::INVALID_ARG_TYPE_INSTANCE(scope, globalObject,
+            "source"_s, "Buffer"_s, "Uint8Array"_s, sourceValue);
+        return {};
+    }
+
+    if (sourceView->isDetached()) [[unlikely]] {
+        Bun::ERR::INVALID_STATE(scope, globalObject,
+            "Cannot transcode a detached buffer"_s);
+        return {};
+    }
+
+    const char* sourceData = reinterpret_cast<const char*>(sourceView->vector());
+    size_t sourceLength = sourceView->byteLength();
+
+    // Empty input → empty Buffer
+    if (sourceLength == 0) {
+        return JSValue::encode(WebCore::createEmptyBuffer(globalObject));
+    }
+
+    // Parse encodings
+    auto fromEncoding = parseTranscodeEncoding(*globalObject, callFrame->argument(1));
+    RETURN_IF_EXCEPTION(scope, {});
+    auto toEncoding = parseTranscodeEncoding(*globalObject, callFrame->argument(2));
+    RETURN_IF_EXCEPTION(scope, {});
+
+    if (!fromEncoding.has_value() || !toEncoding.has_value()) {
+        throwException(globalObject, scope,
+            createError(globalObject, "Unable to transcode Buffer [U_ILLEGAL_ARGUMENT_ERROR]"_s));
+        return {};
+    }
+
+    auto from = fromEncoding.value();
+    auto to = toEncoding.value();
+
+    JSC::JSUint8Array* resultBuffer = nullptr;
+
+    // Same encoding → copy (except ASCII which needs 0x7F masking)
+    if (from == to && from != TranscodeEncoding::ASCII) {
+        resultBuffer = WebCore::createBuffer(globalObject, reinterpret_cast<const uint8_t*>(sourceData), sourceLength);
+        RETURN_IF_EXCEPTION(scope, {});
+        return JSValue::encode(resultBuffer);
+    }
+
+    switch (from) {
+    case TranscodeEncoding::ASCII: {
+        // Node.js ASCII encoding masks bytes > 0x7F with & 0x7F
+        Vector<char> masked(sourceLength);
+        for (size_t i = 0; i < sourceLength; i++)
+            masked[i] = static_cast<char>(static_cast<uint8_t>(sourceData[i]) & 0x7F);
+        const char* maskedData = masked.data();
+
+        switch (to) {
+        case TranscodeEncoding::UCS2: {
+            auto* result = WebCore::createUninitializedBuffer(globalObject, sourceLength * 2);
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            (void)simdutf::convert_latin1_to_utf16le(maskedData, sourceLength,
+                reinterpret_cast<char16_t*>(result->typedVector()));
+            resultBuffer = result;
+            break;
+        }
+        case TranscodeEncoding::ASCII:
+        case TranscodeEncoding::UTF8:
+        case TranscodeEncoding::LATIN1: {
+            // All bytes are <= 0x7F after masking, so the ASCII, UTF-8 and Latin-1
+            // representations are the same bytes and the output length == sourceLength.
+            resultBuffer = WebCore::createBuffer(globalObject, reinterpret_cast<const uint8_t*>(maskedData), sourceLength);
+            break;
+        }
+        }
+        break;
+    }
+    case TranscodeEncoding::LATIN1: {
+        switch (to) {
+        case TranscodeEncoding::UCS2: {
+            auto* result = WebCore::createUninitializedBuffer(globalObject, sourceLength * 2);
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            (void)simdutf::convert_latin1_to_utf16le(sourceData, sourceLength,
+                reinterpret_cast<char16_t*>(result->typedVector()));
+            resultBuffer = result;
+            break;
+        }
+        case TranscodeEncoding::UTF8: {
+            size_t utf8Length = simdutf::utf8_length_from_latin1(sourceData, sourceLength);
+            auto* result = WebCore::createUninitializedBuffer(globalObject, utf8Length);
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            (void)simdutf::convert_latin1_to_utf8(sourceData, sourceLength,
+                reinterpret_cast<char*>(result->typedVector()));
+            resultBuffer = result;
+            break;
+        }
+        case TranscodeEncoding::ASCII: {
+            // Latin1 → ASCII: replace bytes > 0x7F with '?'
+            auto* result = WebCore::createUninitializedBuffer(globalObject, sourceLength);
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            auto* out = result->typedVector();
+            for (size_t i = 0; i < sourceLength; i++) {
+                uint8_t byte = static_cast<uint8_t>(sourceData[i]);
+                out[i] = (byte <= 0x7F) ? byte : '?';
+            }
+            resultBuffer = result;
+            break;
+        }
+        default:
+            // LATIN1 → LATIN1 was already handled by the same-encoding copy above.
+            break;
+        }
+        break;
+    }
+    case TranscodeEncoding::UTF8: {
+        switch (to) {
+        case TranscodeEncoding::UCS2: {
+            // UTF-8 → UCS-2: use simdutf
+            size_t utf16Length = simdutf::utf16_length_from_utf8(sourceData, sourceLength);
+            auto* result = WebCore::createUninitializedBuffer(globalObject, utf16Length * sizeof(char16_t));
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            size_t actual = simdutf::convert_utf8_to_utf16le(sourceData, sourceLength,
+                reinterpret_cast<char16_t*>(result->typedVector()));
+            // Zero code units written for non-empty input is treated as a conversion failure.
+            if (actual == 0 && sourceLength > 0) {
+                throwException(globalObject, scope,
+                    createError(globalObject, "Unable to transcode Buffer [U_INVALID_CHAR_FOUND]"_s));
+                return {};
+            }
+            resultBuffer = result;
+            break;
+        }
+        case TranscodeEncoding::ASCII: {
+            resultBuffer = transcodeUtf8ToAscii(globalObject, sourceData, sourceLength);
+            break;
+        }
+        case TranscodeEncoding::LATIN1: {
+            resultBuffer = transcodeUtf8ToLatin1(globalObject, sourceData, sourceLength);
+            break;
+        }
+        default:
+            // UTF8 → UTF8 was already handled by the same-encoding copy above.
+            break;
+        }
+        break;
+    }
+    case TranscodeEncoding::UCS2: {
+        const char16_t* utf16Data = reinterpret_cast<const char16_t*>(sourceData);
+        // Integer division: a trailing odd byte is not part of any code unit and is ignored.
+        size_t charLength = sourceLength / sizeof(char16_t);
+
+        switch (to) {
+        case TranscodeEncoding::UTF8: {
+            // UCS-2 → UTF-8: use simdutf
+            size_t utf8Length = simdutf::utf8_length_from_utf16le(utf16Data, charLength);
+            auto* result = WebCore::createUninitializedBuffer(globalObject, utf8Length);
+            if (!result) {
+                RETURN_IF_EXCEPTION(scope, {});
+                return {};
+            }
+            size_t actual = simdutf::convert_utf16le_to_utf8(utf16Data, charLength,
+                reinterpret_cast<char*>(result->typedVector()));
+            // Zero bytes written for non-empty input is treated as a conversion failure.
+            if (actual == 0 && charLength > 0) {
+                throwException(globalObject, scope,
+                    createError(globalObject, "Unable to transcode Buffer [U_INVALID_CHAR_FOUND]"_s));
+                return {};
+            }
+            resultBuffer = result;
+            break;
+        }
+        case TranscodeEncoding::ASCII: {
+            resultBuffer = transcodeUcs2ToAscii(globalObject, utf16Data, charLength);
+            break;
+        }
+        case TranscodeEncoding::LATIN1: {
+            resultBuffer = transcodeUcs2ToLatin1(globalObject, utf16Data, charLength);
+            break;
+        }
+        default:
+            // UCS2 → UCS2 was already handled by the same-encoding copy above.
+            break;
+        }
+        break;
+    }
+    }
+
+    // A null result means a helper failed to create its buffer (or no case matched):
+    // propagate a pending exception if there is one, otherwise report a generic failure.
+    if (!resultBuffer) {
+        RETURN_IF_EXCEPTION(scope, {});
+        throwException(globalObject, scope,
+            createError(globalObject, "Unable to transcode Buffer [U_ILLEGAL_ARGUMENT_ERROR]"_s));
+        return {};
+    }
+
+    RETURN_IF_EXCEPTION(scope, {});
+    return JSValue::encode(resultBuffer);
+}
+
 JSC_DEFINE_HOST_FUNCTION(jsFunctionNotImplemented,
    (JSGlobalObject * globalObject,
        CallFrame* callFrame))
@@ -203,9 +630,7 @@ DEFINE_NATIVE_MODULE(NodeBuffer)
    put(atobI, atobV);
    put(btoaI, btoaV);

-    auto* transcode = InternalFunction::createFunctionThatMasqueradesAsUndefined(vm, globalObject, 1, "transcode"_s, jsFunctionNotImplemented);
-
-    put(JSC::Identifier::fromString(vm, "transcode"_s), transcode);
+    put(JSC::Identifier::fromString(vm, "transcode"_s), JSC::JSFunction::create(vm, globalObject, 3, "transcode"_s, jsFunction_transcode, ImplementationVisibility::Public, NoIntrinsic, jsFunction_transcode));

    auto* resolveObjectURL = JSC::JSFunction::create(vm, globalObject, 1, "resolveObjectURL"_s, jsFunctionResolveObjectURL, ImplementationVisibility::Public, NoIntrinsic, jsFunctionResolveObjectURL);

--- a/test/js/node/buffer.test.js
+++ b/test/js/node/buffer.test.js
@@ -2188,10 +2188,39 @@ for (let withOverridenBufferWrite of [false, true]) {
      });

      it("transcode", () => {
-        expect(typeof BufferModule.transcode).toBe("undefined");
+        expect(typeof BufferModule.transcode).toBe("function");

-        // This is a masqueradesAsUndefined function
-        expect(() => BufferModule.transcode()).toThrow("Not implemented");
+        // Basic UTF-8 to ASCII
+        const euroUtf8 = Buffer.from("€", "utf8");
+        const asciiResult = BufferModule.transcode(euroUtf8, "utf8", "ascii");
+        expect(asciiResult.toString("ascii")).toBe("?");
+
+        // UTF-8 to Latin-1
+        const orig = Buffer.from("těst ☕", "utf8");
+        const latin1 = BufferModule.transcode(orig, "utf8", "latin1");
+        expect(Array.from(latin1)).toEqual([0x74, 0x3f, 0x73, 0x74, 0x20, 0x3f]);
+
+        // UTF-8 to UCS-2
+        const ucs2 = BufferModule.transcode(orig, "utf8", "ucs2");
+        expect(Array.from(ucs2)).toEqual([0x74, 0x00, 0x1b, 0x01, 0x73, 0x00, 0x74, 0x00, 0x20, 0x00, 0x15, 0x26]);
+
+        // Round-trip UCS-2 → UTF-8
+        const backToUtf8 = BufferModule.transcode(Buffer.from(ucs2), "ucs2", "utf8");
+        expect(backToUtf8.toString()).toBe(orig.toString());
+
+        // Empty input
+        const empty = BufferModule.transcode(new Uint8Array(), "utf8", "latin1");
+        expect(empty.length).toBe(0);
+
+        // Invalid source type
+        expect(() => BufferModule.transcode(null, "utf8", "ascii")).toThrow();
+
+        // Invalid encoding
+        expect(() => BufferModule.transcode(Buffer.from("a"), "b", "utf8")).toThrow(/U_ILLEGAL_ARGUMENT_ERROR/);
+
+        // Uint8Array support
+        const uint8arr = new Uint8Array([...Buffer.from("hä", "latin1")]);
+        expect(BufferModule.transcode(uint8arr, "latin1", "utf16le")).toEqual(Buffer.from("hä", "utf16le"));
      });

      it("Buffer.from (Node.js test/test-buffer-from.js)", () => {
--- a/test/js/node/domexception-node.test.js
+++ b/test/js/node/domexception-node.test.js
@@ -56,7 +56,8 @@ describe("DOMException in Node.js environment", () => {
    expect(DOMException.DATA_CLONE_ERR).toBe(25);
  });

-  it("inherits prototype properties from Error", () => {
+  // TODO: missing stack trace on DOMException
+  it.failing("inherits prototype properties from Error", () => {
    const error = new DOMException("Test error");
    expect(error.toString()).toBe("Error: Test error");
    expect(error.stack).toBeDefined();
--- a/test/js/web/abort/abort.test.ts
+++ b/test/js/web/abort/abort.test.ts
@@ -67,7 +67,7 @@ describe("AbortSignal", () => {
  function fmt(value: any) {
    const res = {};
    for (const key in value) {
-      if (key === "column" || key === "line" || key === "sourceURL" || key === "stack") continue;
+      if (key === "column" || key === "line" || key === "sourceURL") continue;
      res[key] = value[key];
    }
    return res;
--- a/test/regression/issue/17877.test.ts
+++ b/test/regression/issue/17877.test.ts
@@ -1,79 +0,0 @@
-import { expect, test } from "bun:test";
-
-test("DOMException from new DOMException() has a stack trace", () => {
-  const e = new DOMException("test error", "AbortError");
-  expect(typeof e.stack).toBe("string");
-  expect(e.stack).toContain("AbortError: test error");
-  expect(e.stack).toContain("17877.test");
-  expect(e instanceof DOMException).toBe(true);
-  expect(e instanceof Error).toBe(true);
-});
-
-test("DOMException from AbortSignal.abort() has a stack trace", () => {
-  const signal = AbortSignal.abort();
-  try {
-    signal.throwIfAborted();
-    expect.unreachable();
-  } catch (err: any) {
-    expect(typeof err.stack).toBe("string");
-    expect(err.stack).toContain("AbortError");
-    expect(err.stack).toContain("The operation was aborted");
-    expect(err instanceof DOMException).toBe(true);
-    expect(err instanceof Error).toBe(true);
-  }
-});
-
-test("DOMException stack trace includes correct name and message", () => {
-  const e = new DOMException("custom message", "NotFoundError");
-  expect(typeof e.stack).toBe("string");
-  expect(e.stack).toStartWith("NotFoundError: custom message\n");
-});
-
-test("DOMException with default args has a stack trace", () => {
-  const e = new DOMException();
-  expect(typeof e.stack).toBe("string");
-  expect(e.name).toBe("Error");
-  expect(e.message).toBe("");
-});
-
-test("DOMException stack trace shows correct call site", () => {
-  function createException() {
-    return new DOMException("inner", "DataError");
-  }
-
-  const e = createException();
-  expect(typeof e.stack).toBe("string");
-  expect(e.stack).toContain("createException");
-});
-
-test("DOMException.stack is writable", () => {
-  const e = new DOMException("test", "AbortError");
-  expect(typeof e.stack).toBe("string");
-  e.stack = "custom stack";
-  expect(e.stack).toBe("custom stack");
-});
-
-test("DOMException from AbortSignal.abort() with custom reason has no stack on reason", () => {
-  const reason = "custom reason string";
-  const signal = AbortSignal.abort(reason);
-  try {
-    signal.throwIfAborted();
-    expect.unreachable();
-  } catch (err: any) {
-    // When a custom reason (non-DOMException) is used, it's thrown as-is
-    expect(err).toBe("custom reason string");
-  }
-});
-
-test("DOMException from AbortSignal.abort() with DOMException reason has stack", () => {
-  const reason = new DOMException("custom abort", "AbortError");
-  const signal = AbortSignal.abort(reason);
-  try {
-    signal.throwIfAborted();
-    expect.unreachable();
-  } catch (err: any) {
-    expect(err).toBe(reason);
-    expect(typeof err.stack).toBe("string");
-    expect(err.stack).toContain("AbortError: custom abort");
-  }
-});
--- a/test/regression/issue/24235.test.ts
+++ b/test/regression/issue/24235.test.ts
@@ -0,0 +1,76 @@
+import { expect, test } from "bun:test";
+import * as buffer from "node:buffer";
+
+test("buffer.transcode is a function, not undefined", () => {
+  expect(typeof buffer.transcode).toBe("function");
+});
+
+test("buffer.transcode converts UTF-8 to ASCII with ? substitution", () => {
+  const newBuf = buffer.transcode(Buffer.from("€"), "utf8", "ascii");
+  expect(newBuf.toString("ascii")).toBe("?");
+});
+
+test("buffer.transcode converts UTF-8 to Latin-1 with ? substitution", () => {
+  const orig = Buffer.from("těst ☕", "utf8");
+  const dest = buffer.transcode(orig, "utf8", "latin1");
+  // Latin-1 can only represent codepoints up to U+00FF; anything above is replaced with '?' (0x3F).
+  // ě is U+011B, which is above U+00FF, so it becomes 0x3F.
+  // ☕ is U+2615, also above U+00FF, so it becomes 0x3F as well.
+  expect(Array.from(dest)).toEqual([0x74, 0x3f, 0x73, 0x74, 0x20, 0x3f]);
+});
+
+test("buffer.transcode converts UTF-8 to UCS-2", () => {
+  const orig = Buffer.from("těst ☕", "utf8");
+  const dest = buffer.transcode(orig, "utf8", "ucs2");
+  expect(Array.from(dest)).toEqual([0x74, 0x00, 0x1b, 0x01, 0x73, 0x00, 0x74, 0x00, 0x20, 0x00, 0x15, 0x26]);
+});
+
+test("buffer.transcode round-trips UCS-2 to UTF-8", () => {
+  const orig = Buffer.from("těst ☕", "utf8");
+  const ucs2 = buffer.transcode(orig, "utf8", "ucs2");
+  const back = buffer.transcode(Buffer.from(ucs2), "ucs2", "utf8");
+  expect(back.toString()).toBe(orig.toString());
+});
+
+test("buffer.transcode handles large data", () => {
+  const repeated = Buffer.alloc(4000 * Buffer.byteLength("€"), "€").toString();
+  const utf8 = Buffer.from(repeated, "utf8");
+  const ucs2 = Buffer.from(repeated, "ucs2");
+  const utf8_to_ucs2 = buffer.transcode(utf8, "utf8", "ucs2");
+  const ucs2_to_utf8 = buffer.transcode(ucs2, "ucs2", "utf8");
+  expect(Buffer.compare(utf8, ucs2_to_utf8)).toBe(0);
+  expect(Buffer.compare(ucs2, utf8_to_ucs2)).toBe(0);
+});
+
+test("buffer.transcode throws on invalid source type", () => {
+  expect(() => buffer.transcode(null as any, "utf8", "ascii")).toThrow();
+});
+
+test("buffer.transcode throws on unsupported encoding", () => {
+  expect(() => buffer.transcode(Buffer.from("a"), "b" as any, "utf8")).toThrow(/U_ILLEGAL_ARGUMENT_ERROR/);
+  expect(() => buffer.transcode(Buffer.from("a"), "uf8" as any, "b" as any)).toThrow(/U_ILLEGAL_ARGUMENT_ERROR/);
+});
+
+test("buffer.transcode ASCII/Latin-1 to UTF-16LE", () => {
+  expect(buffer.transcode(Buffer.from("hi", "ascii"), "ascii", "utf16le")).toEqual(Buffer.from("hi", "utf16le"));
+  expect(buffer.transcode(Buffer.from("hi", "latin1"), "latin1", "utf16le")).toEqual(Buffer.from("hi", "utf16le"));
+  expect(buffer.transcode(Buffer.from("hä", "latin1"), "latin1", "utf16le")).toEqual(Buffer.from("hä", "utf16le"));
+});
+
+test("buffer.transcode accepts Uint8Array", () => {
+  const uint8array = new Uint8Array([...Buffer.from("hä", "latin1")]);
+  expect(buffer.transcode(uint8array, "latin1", "utf16le")).toEqual(Buffer.from("hä", "utf16le"));
+});
+
+test("buffer.transcode empty input", () => {
+  const dest = buffer.transcode(new Uint8Array(), "utf8", "latin1");
+  expect(dest.length).toBe(0);
+});
+
+test("buffer.transcode doesn't crash with allocUnsafeSlow", () => {
+  // Test that allocUnsafeSlow buffers work with transcode
+  const slowBuf = buffer.Buffer.allocUnsafeSlow(4);
+  slowBuf.write("hi", "utf16le");
+  const result = buffer.transcode(slowBuf, "utf16le", "utf8");
+  expect(result.toString()).toBe("hi");
+});
Author	SHA1	Message	Date
Claude	f841c17731	Fix ascii→ascii shortcut bypassing 0x7F masking The `from == to` optimization copied the buffer unchanged for all same-encoding pairs, but ascii→ascii must mask each byte with & 0x7F per Node.js semantics. Exclude ASCII from the shortcut and add an explicit ascii→ascii case that copies the already-masked data. https://claude.ai/code/session_01WK9KQWWRoS7dcmZmUbUo8M	2026-02-21 06:32:42 +00:00
Claude	9ab36c6b0a	Validate UTF-8 continuation bytes before accepting multi-byte sequences Add validateUtf8Continuations() helper that checks each continuation byte has the 10xxxxxx pattern. Applied in both countUtf8Codepoints (for accurate output length calculation) and transcodeUtf8ToSingleByte (for correct '?' emission). Sequences with bad continuation bytes now treat the start byte as invalid, emit '?', and advance by 1. https://claude.ai/code/session_01WK9KQWWRoS7dcmZmUbUo8M	2026-02-21 06:02:31 +00:00
Claude	c215477bce	Fix invalid UTF-8 handling, ASCII masking semantics, and test guidelines - transcodeUtf8ToSingleByte now validates UTF-8 first; on invalid input, uses safe counting pass and emits '?' per bad/truncated byte instead of leaving uninitialized memory - Separate ASCII from Latin-1 transcoding: ASCII masks bytes >0x7F with & 0x7F per Node.js semantics before conversion to UCS2/UTF8/Latin1 - Replace .repeat(4000) with Buffer.alloc pattern per test guidelines https://claude.ai/code/session_01WK9KQWWRoS7dcmZmUbUo8M	2026-02-21 05:52:31 +00:00
Claude	23dc6d6704	Address review comments: deduplicate UTF-8 helpers, add detached buffer check, improve test - Extract shared UTF-8 decode loop into transcodeUtf8ToSingleByte with threshold param - Add isDetached() check before accessing sourceView->vector() in jsFunction_transcode - Update allocUnsafeSlow test to use a proper 4-byte buffer exercising the UTF-16 path https://claude.ai/code/session_01WK9KQWWRoS7dcmZmUbUo8M	2026-02-21 05:04:21 +00:00
Claude Bot	7183dc224e	fix: implement `buffer.transcode()` from `node:buffer` Implements the `transcode` function which was previously stubbed with a "Not implemented" error. Supports all encoding pairs that Node.js supports: utf8, ascii, latin1, and ucs2/utf16le. Uses simdutf for fast SIMD-accelerated conversions where possible, with custom paths for ASCII/Latin-1 substitution (replacing unmappable characters with '?'). Closes #24235 Co-Authored-By: Claude <noreply@anthropic.com>	2026-02-20 04:45:22 +00:00