fixup! buffer: add buffer.isUtf8 for utf8 validation

nodejs · nodejs-github-bot · Dec 25, 2022 · Dec 22, 2022 · Dec 23, 2022 · Dec 23, 2022
commit b590f061edbbca3568f07869dc461da4717a807e
diff --git a/src/node_buffer.cc b/src/node_buffer.cc
@@ -1226,11 +1226,13 @@ static void EncodeInto(const FunctionCallbackInfo<Value>& args) {
 static void IsUtf8(const FunctionCallbackInfo<Value>& args) {
   Environment* env = Environment::GetCurrent(args);
   CHECK_EQ(args.Length(), 1);
-  CHECK(args[0]->IsTypedArray() || args[0]->IsArrayBuffer());
+  CHECK(args[0]->IsTypedArray() || args[0]->IsArrayBuffer() ||
+        args[0]->IsSharedArrayBuffer());
   ArrayBufferViewContents<char> abv(args[0]);
 
   if (abv.WasDetached()) {
-    return node::THROW_ERR_BUFFER_CONTEXT_NOT_AVAILABLE(env->isolate());
+    return node::THROW_ERR_INVALID_STATE(
+        env, "Cannot validate on a detached buffer");
   }
 
   args.GetReturnValue().Set(simdutf::validate_utf8(abv.data(), abv.length()));

diff --git a/src/node_errors.h b/src/node_errors.h
@@ -68,6 +68,7 @@ void OOMErrorHandler(const char* location, const v8::OOMDetails& details);
   V(ERR_INVALID_ARG_TYPE, TypeError)                                           \
   V(ERR_INVALID_OBJECT_DEFINE_PROPERTY, TypeError)                             \
   V(ERR_INVALID_MODULE, Error)                                                 \
+  V(ERR_INVALID_STATE, Error)                                                  \
   V(ERR_INVALID_THIS, TypeError)                                               \
   V(ERR_INVALID_TRANSFER_OBJECT, TypeError)                                    \
   V(ERR_MEMORY_ALLOCATION_FAILED, Error)                                       \

diff --git a/test/parallel/test-buffer-isutf8.js b/test/parallel/test-buffer-isutf8.js
@@ -9,9 +9,21 @@ const encoder = new TextEncoder();
 
 assert.strictEqual(isUtf8(encoder.encode('hello')), true);
 assert.strictEqual(isUtf8(encoder.encode('ğ')), true);
+assert.strictEqual(isUtf8(Buffer.from([])), true);
+
+// Invalid UTF-8
 assert.strictEqual(isUtf8(Buffer.from([0xf8])), false);
+
+// CESU-8 sample text; TextEncoder emits it as well-formed UTF-8
+assert.strictEqual(isUtf8(encoder.encode('\u0045\u0205\u10400')), true);
 assert.strictEqual(isUtf8(encoder.encode('aé日')), true);
 
+// U+0000 (TextEncoder emits the single byte 0x00, not the overlong C0 80)
+assert.strictEqual(isUtf8(encoder.encode('\u0000')), true);
+
+// Paired surrogates (encoded as the 4-byte sequence for U+103FF, not WTF-8)
+assert.strictEqual(isUtf8(encoder.encode('\uD800\uDFFF')), true);
+
 [
   null,
   undefined,
@@ -34,7 +46,7 @@ assert.strictEqual(isUtf8(encoder.encode('aé日')), true);
   assert.throws(
     () => { isUtf8(arrayBuffer); },
     {
-      code: 'ERR_BUFFER_CONTEXT_NOT_AVAILABLE'
+      code: 'ERR_INVALID_STATE'
     }
   );
 }