From fb86fb925aa70e9cdb62727cd049d220ce7af8d0 Mon Sep 17 00:00:00 2001
From: Yagiz Nizipli <yagiz@nizipli.com>
Date: Thu, 11 Jun 2026 18:03:07 -0400
Subject: [PATCH 1/3] src: improve compile cache performance and size

Improve the compile cache by:

- Reading cache files with a single exactly-sized read using the file
  size from fstat instead of reading into an exponentially growing
  buffer, which previously cost O(log N) syscalls and allocations and
  about 2N bytes of copying per file.
- Compressing the cache content on disk with zstd at level 1, falling
  back to raw storage when the data is not compressible. This shrinks
  cache directories by about 2-4x. The magic number is bumped so that
  files in the old format are discarded as cache misses and then
  overwritten in place.
- Handing the cache to V8 through a non-owning CachedData wrapper
  instead of copying the whole buffer on every cache hit.

Corrupted cache files still degrade to silent cache misses and are
regenerated; this behavior is now covered by a regression test.

Co-authored-by: Grok <grok@x.ai>
Signed-off-by: Yagiz Nizipli <yagiz@nizipli.com>
---
 src/compile_cache.cc                          | 212 +++++++++++++-----
 src/compile_cache.h                           |  12 +-
 src/module_wrap.cc                            |   5 +-
 src/node_contextify.cc                        |   5 +-
 test/parallel/test-compile-cache-corrupted.js | 128 +++++++++++
 5 files changed, 294 insertions(+), 68 deletions(-)
 create mode 100644 test/parallel/test-compile-cache-corrupted.js
diff --git a/src/compile_cache.cc b/src/compile_cache.cc
index dd097acd86f8e4..38615900ec3d56 100644
--- a/src/compile_cache.cc
+++ b/src/compile_cache.cc
@@ -1,4 +1,6 @@
 #include "compile_cache.h"
+#include <array>
+#include <memory>
 #include <string>
 #include "debug_utils-inl.h"
 #include "env-inl.h"
@@ -8,6 +10,7 @@
 #include "path.h"
 #include "util.h"
 #include "zlib.h"
+#include "zstd.h"
 
 #ifdef NODE_IMPLEMENTS_POSIX_CREDENTIALS
 #include <unistd.h>  // getuid
@@ -75,18 +78,21 @@ inline void CompileCacheHandler::Debug(const char* format,
   }
 }
 
-ScriptCompiler::CachedData* CompileCacheEntry::CopyCache() const {
+ScriptCompiler::CachedData* CompileCacheEntry::WrapCache() const {
   DCHECK_NOT_NULL(cache);
-  int cache_size = cache->length;
-  uint8_t* data = new uint8_t[cache_size];
-  memcpy(data, cache->data, cache_size);
+  // The returned CachedData does not own the buffer - it's a view into
+  // the buffer owned by this entry, which outlives the synchronous
+  // consumption of the cache during compilation, so no copy is necessary.
   return new ScriptCompiler::CachedData(
-      data, cache_size, ScriptCompiler::CachedData::BufferOwned);
+      cache->data, cache->length, ScriptCompiler::CachedData::BufferNotOwned);
 }
 
 // Used for identifying and verifying a file is a compile cache file.
 // See comments in CompileCacheHandler::Persist().
-constexpr uint32_t kCacheMagicNumber = 0x8adfdbb2;
+// The least significant byte is bumped whenever the format of the cache
+// file changes so that files in an older format are discarded as cache
+// misses and then overwritten with the new format.
+constexpr uint32_t kCacheMagicNumber = 0x8adfdbb3;
 
 const char* CompileCacheEntry::type_name() const {
   switch (type) {
@@ -124,10 +130,21 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
     uv_fs_req_cleanup(&close_req);
   });
 
+  // Get the file size upfront so that the cache can be read with a single
+  // exactly-sized read, and truncated or trailing data can be detected
+  // without additional read attempts.
+  int err = uv_fs_fstat(nullptr, &req, file, nullptr);
+  if (err < 0) {
+    Debug("fstat failed, %s\n", uv_strerror(err));
+    return;
+  }
+  uint64_t file_size = req.statbuf.st_size;
+  uv_fs_req_cleanup(&req);
+
   // Read the headers.
-  std::vector<uint32_t> headers(kHeaderCount);
-  uv_buf_t headers_buf = uv_buf_init(reinterpret_cast<char*>(headers.data()),
-                                     kHeaderCount * sizeof(uint32_t));
+  std::array<uint32_t, kHeaderCount> headers;
+  uv_buf_t headers_buf =
+      uv_buf_init(reinterpret_cast<char*>(headers.data()), kHeaderSize);
   const int r = uv_fs_read(nullptr, &req, file, &headers_buf, 1, 0, nullptr);
   if (r != static_cast<int>(headers_buf.len)) {
     Debug("reading header failed, bytes read %d", r);
@@ -137,13 +154,15 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
     Debug("\n");
     return;
   }
+  uv_fs_req_cleanup(&req);
 
-  Debug("[%d %d %d %d %d]...",
+  Debug("[%d %d %d %d %d %d]...",
         headers[kMagicNumberOffset],
         headers[kCodeSizeOffset],
         headers[kCacheSizeOffset],
         headers[kCodeHashOffset],
-        headers[kCacheHashOffset]);
+        headers[kCacheHashOffset],
+        headers[kCacheRawSizeOffset]);
 
   if (headers[kMagicNumberOffset] != kCacheMagicNumber) {
     Debug("magic number mismatch: expected %d, actual %d\n",
@@ -166,50 +185,57 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
     return;
   }
 
-  // Read the cache, grow the buffer exponentially whenever it fills up.
-  size_t offset = headers_buf.len;
-  size_t capacity = 4096;  // Initial buffer capacity
-  size_t total_read = 0;
-  uint8_t* buffer = new uint8_t[capacity];
-
-  while (true) {
-    // If there is not enough space to read more data, do a simple
-    // realloc here (we don't actually realloc because V8 requires
-    // the underlying buffer to be delete[]-able).
-    if (total_read == capacity) {
-      size_t new_capacity = capacity * 2;
-      auto* new_buffer = new uint8_t[new_capacity];
-      memcpy(new_buffer, buffer, capacity);
-      delete[] buffer;
-      buffer = new_buffer;
-      capacity = new_capacity;
-    }
+  uint32_t cache_size = headers[kCacheSizeOffset];
+  uint32_t raw_size = headers[kCacheRawSizeOffset];
+
+  // Check the cache size: the file must be exactly the headers followed
+  // by cache_size bytes. The header read succeeded, so file_size should
+  // be >= kHeaderSize; if not, the unsigned wrap still yields a mismatch.
+  if (file_size - kHeaderSize != cache_size) {
+    Debug("cache size mismatch: expected %d, actual %d\n",
+          cache_size,
+          file_size - kHeaderSize);
+    return;
+  }
 
-    uv_buf_t iov = uv_buf_init(reinterpret_cast<char*>(buffer + total_read),
-                               capacity - total_read);
-    int bytes_read =
-        uv_fs_read(nullptr, &req, file, &iov, 1, offset + total_read, nullptr);
+  // The cache content is stored uncompressed when cache_size == raw_size,
+  // and zstd-compressed when cache_size < raw_size (see
+  // CompileCacheHandler::Persist()). Anything else is invalid.
+  if (cache_size > raw_size) {
+    Debug("invalid cache size %d > uncompressed size %d\n",
+          cache_size,
+          raw_size);
+    return;
+  }
+
+  // Read the cache content in one go with an exactly-sized buffer,
+  // looping only in case of short reads.
+  std::unique_ptr<uint8_t[]> disk_data(new uint8_t[cache_size]);
+  size_t total_read = 0;
+  while (total_read < cache_size) {
+    uv_buf_t iov =
+        uv_buf_init(reinterpret_cast<char*>(disk_data.get() + total_read),
+                    cache_size - total_read);
+    int bytes_read = uv_fs_read(
+        nullptr, &req, file, &iov, 1, kHeaderSize + total_read, nullptr);
     if (req.result < 0) {  // Error.
       // req will be cleaned up by scope leave.
-      delete[] buffer;
       Debug(" %s\n", uv_strerror(req.result));
       return;
     }
     uv_fs_req_cleanup(&req);
-    if (bytes_read <= 0) {
-      break;
+    if (bytes_read == 0) {  // Unexpected EOF - the file shrank under us.
+      Debug("cache size mismatch: expected %d, actual %d\n",
+            cache_size,
+            total_read);
+      return;
     }
     total_read += bytes_read;
   }
 
-  // Check the cache size and hash.
-  if (headers[kCacheSizeOffset] != total_read) {
-    Debug("cache size mismatch: expected %d, actual %d\n",
-          headers[kCacheSizeOffset],
-          total_read);
-    return;
-  }
-  uint32_t cache_hash = GetHash(reinterpret_cast<char*>(buffer), total_read);
+  // Check the cache hash of the on-disk content before decompressing.
+  uint32_t cache_hash =
+      GetHash(reinterpret_cast<char*>(disk_data.get()), cache_size);
   if (headers[kCacheHashOffset] != cache_hash) {
     Debug("cache hash mismatch: expected %d, actual %d\n",
           headers[kCacheHashOffset],
@@ -217,9 +243,44 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
     return;
   }
 
-  entry->cache.reset(new ScriptCompiler::CachedData(
-      buffer, total_read, ScriptCompiler::CachedData::BufferOwned));
-  Debug(" success, size=%d\n", total_read);
+  if (cache_size == raw_size) {
+    // Stored uncompressed - hand the buffer to V8 directly.
+    entry->cache.reset(new ScriptCompiler::CachedData(
+        disk_data.release(),
+        raw_size,
+        ScriptCompiler::CachedData::BufferOwned));
+  } else {
+    // Cross-check the content size embedded in the zstd frame before
+    // allocating, in case the headers are corrupted.
+    unsigned long long content_size =  // NOLINT(runtime/int)
+        ZSTD_getFrameContentSize(disk_data.get(), cache_size);
+    if (content_size != raw_size) {
+      Debug("uncompressed size mismatch: expected %d, actual %d\n",
+            raw_size,
+            content_size);
+      return;
+    }
+    // Decompress directly into the buffer handed to V8.
+    std::unique_ptr<uint8_t[]> raw_data(new uint8_t[raw_size]);
+    size_t decompressed_size =
+        ZSTD_decompress(raw_data.get(), raw_size, disk_data.get(), cache_size);
+    if (ZSTD_isError(decompressed_size)) {
+      Debug("decompression failed: %s\n",
+            ZSTD_getErrorName(decompressed_size));
+      return;
+    }
+    if (decompressed_size != raw_size) {
+      Debug("decompressed size mismatch: expected %d, actual %d\n",
+            raw_size,
+            decompressed_size);
+      return;
+    }
+    entry->cache.reset(new ScriptCompiler::CachedData(
+        raw_data.release(),
+        raw_size,
+        ScriptCompiler::CachedData::BufferOwned));
+  }
+  Debug(" success, size=%d\n", raw_size);
 }
 
 static std::string GetRelativePath(std::string_view path,
@@ -280,11 +341,18 @@ CompileCacheEntry* CompileCacheHandler::GetOrInsert(Local<String> code,
     return loaded->second.get();
   }
 
-  // If the code hash mismatches, the code has changed, discard the stale entry
-  // and create a new one.
-  auto emplaced =
-      compiler_cache_store_.emplace(key, std::make_unique<CompileCacheEntry>());
-  auto* result = emplaced.first->second.get();
+  // If the code hash mismatches, the code has changed, reset the stale
+  // entry in place. Otherwise insert a new one.
+  CompileCacheEntry* result;
+  if (loaded != compiler_cache_store_.end()) {
+    result = loaded->second.get();
+    result->refreshed = false;
+    result->persisted = false;
+  } else {
+    result = compiler_cache_store_
+                 .emplace(key, std::make_unique<CompileCacheEntry>())
+                 .first->second.get();
+  }
 
   result->code_hash = code_hash;
   result->code_size = code_utf8.length();
@@ -418,18 +486,41 @@ void CompileCacheHandler::Persist() {
 
     DCHECK_EQ(entry->cache->buffer_policy,
               ScriptCompiler::CachedData::BufferOwned);
-    char* cache_ptr =
+    char* raw_ptr =
         reinterpret_cast<char*>(const_cast<uint8_t*>(entry->cache->data));
-    uint32_t cache_size = static_cast<uint32_t>(entry->cache->length);
+    uint32_t raw_size = static_cast<uint32_t>(entry->cache->length);
+
+    // Compress the cache with zstd to reduce the size on disk. Compression
+    // level 1 prioritizes speed - persistence usually happens on process
+    // shutdown and should add as little overhead as possible. If the data
+    // is not compressible, store it uncompressed, which is indicated by
+    // the cache size being equal to the uncompressed size in the headers.
+    size_t compressed_bound = ZSTD_compressBound(raw_size);
+    std::unique_ptr<uint8_t[]> compressed(new uint8_t[compressed_bound]);
+    size_t compressed_size = ZSTD_compress(
+        compressed.get(), compressed_bound, raw_ptr, raw_size, 1);
+    char* cache_ptr = raw_ptr;
+    uint32_t cache_size = raw_size;
+    if (!ZSTD_isError(compressed_size) && compressed_size < raw_size) {
+      cache_ptr = reinterpret_cast<char*>(compressed.get());
+      cache_size = static_cast<uint32_t>(compressed_size);
+    }
+    Debug("[compile cache] compressed cache for %s %s: %d -> %d bytes\n",
+          type_name,
+          entry->source_filename,
+          raw_size,
+          cache_size);
+
     uint32_t cache_hash = GetHash(cache_ptr, cache_size);
 
     // Generating headers.
-    std::vector<uint32_t> headers(kHeaderCount);
+    std::array<uint32_t, kHeaderCount> headers;
     headers[kMagicNumberOffset] = kCacheMagicNumber;
     headers[kCodeSizeOffset] = entry->code_size;
     headers[kCacheSizeOffset] = cache_size;
     headers[kCodeHashOffset] = entry->code_hash;
     headers[kCacheHashOffset] = cache_hash;
+    headers[kCacheRawSizeOffset] = raw_size;
 
     // Generate the temporary filename.
     // The temporary file should be placed in a location like:
@@ -459,7 +550,7 @@ void CompileCacheHandler::Persist() {
     Debug(" -> %s\n", mkstemp_req.path);
     Debug("[compile cache] writing cache for %s %s to temporary file %s [%d "
           "%d %d "
-          "%d %d]...",
+          "%d %d %d]...",
           type_name,
           entry->source_filename,
           mkstemp_req.path,
@@ -467,12 +558,13 @@ void CompileCacheHandler::Persist() {
           headers[kCodeSizeOffset],
           headers[kCacheSizeOffset],
           headers[kCodeHashOffset],
-          headers[kCacheHashOffset]);
+          headers[kCacheHashOffset],
+          headers[kCacheRawSizeOffset]);
 
     // Write to the temporary file.
-    uv_buf_t headers_buf = uv_buf_init(reinterpret_cast<char*>(headers.data()),
-                                       headers.size() * sizeof(uint32_t));
-    uv_buf_t data_buf = uv_buf_init(cache_ptr, entry->cache->length);
+    uv_buf_t headers_buf =
+        uv_buf_init(reinterpret_cast<char*>(headers.data()), kHeaderSize);
+    uv_buf_t data_buf = uv_buf_init(cache_ptr, cache_size);
     uv_buf_t bufs[] = {headers_buf, data_buf};
 
     uv_fs_t write_req;
diff --git a/src/compile_cache.h b/src/compile_cache.h
index 62934332103661..7ecd6d0910197e 100644
--- a/src/compile_cache.h
+++ b/src/compile_cache.h
@@ -36,9 +36,11 @@ struct CompileCacheEntry {
   bool refreshed = false;
   bool persisted = false;
 
-  // Copy the cache into a new store for V8 to consume. Caller takes
-  // ownership.
-  v8::ScriptCompiler::CachedData* CopyCache() const;
+  // Wrap the cache into a non-owning CachedData for V8 to consume.
+  // The caller takes ownership of the returned wrapper object, while
+  // the underlying buffer remains owned by this entry and must outlive
+  // the consumption of the wrapper.
+  v8::ScriptCompiler::CachedData* WrapCache() const;
   const char* type_name() const;
 };
 
@@ -99,7 +101,9 @@ class CompileCacheHandler {
   static constexpr size_t kCacheSizeOffset = 2;
   static constexpr size_t kCodeHashOffset = 3;
   static constexpr size_t kCacheHashOffset = 4;
-  static constexpr size_t kHeaderCount = 5;
+  static constexpr size_t kCacheRawSizeOffset = 5;
+  static constexpr size_t kHeaderCount = 6;
+  static constexpr size_t kHeaderSize = kHeaderCount * sizeof(uint32_t);
 
   v8::Isolate* isolate_ = nullptr;
   bool is_debug_ = false;
diff --git a/src/module_wrap.cc b/src/module_wrap.cc
index 87a8b4d57726af..1f0c0912dea013 100644
--- a/src/module_wrap.cc
+++ b/src/module_wrap.cc
@@ -521,8 +521,9 @@ MaybeLocal<Module> ModuleWrap::CompileSourceTextModule(
   }
 
   if (cache_entry != nullptr && cache_entry->cache != nullptr) {
-    // source will take ownership of cached_data.
-    cached_data = cache_entry->CopyCache();
+    // source only takes ownership of the cached_data wrapper - the
+    // underlying buffer is still owned by the compile cache entry.
+    cached_data = cache_entry->WrapCache();
   }
 
   ScriptCompiler::Source source(source_text, origin, cached_data);
diff --git a/src/node_contextify.cc b/src/node_contextify.cc
index f319420ae02f35..3d615dbe81e115 100644
--- a/src/node_contextify.cc
+++ b/src/node_contextify.cc
@@ -1675,8 +1675,9 @@ static MaybeLocal<Function> CompileFunctionForCJSLoader(
         code, filename, CachedCodeType::kCommonJS);
   }
   if (cache_entry != nullptr && cache_entry->cache != nullptr) {
-    // source will take ownership of cached_data.
-    cached_data = cache_entry->CopyCache();
+    // source only takes ownership of the cached_data wrapper - the
+    // underlying buffer is still owned by the compile cache entry.
+    cached_data = cache_entry->WrapCache();
   }
 
   ScriptCompiler::Source source(code, origin, cached_data);
diff --git a/test/parallel/test-compile-cache-corrupted.js b/test/parallel/test-compile-cache-corrupted.js
new file mode 100644
index 00000000000000..b63b82440c66e2
--- /dev/null
+++ b/test/parallel/test-compile-cache-corrupted.js
@@ -0,0 +1,128 @@
+'use strict';
+
+// This tests that NODE_COMPILE_CACHE gracefully discards corrupted
+// cache files and regenerates them.
+
+require('../common');
+const { spawnSyncAndAssert } = require('../common/child_process');
+const assert = require('assert');
+const fs = require('fs');
+const os = require('os');
+const path = require('path');
+const tmpdir = require('../common/tmpdir');
+
+// Header size and byte offsets of the cache file (see src/compile_cache.h).
+const kHeaderSize = 6 * 4;
+const kCacheRawSizeOffset = 5 * 4;
+
+function readU32(buf, offset) {
+  return os.endianness() === 'LE' ?
+    buf.readUInt32LE(offset) : buf.readUInt32BE(offset);
+}
+
+function writeU32(buf, value, offset) {
+  if (os.endianness() === 'LE') {
+    buf.writeUInt32LE(value, offset);
+  } else {
+    buf.writeUInt32BE(value, offset);
+  }
+}
+
+tmpdir.refresh();
+const dir = tmpdir.resolve('.compile_cache_dir');
+const script = tmpdir.resolve('script.js');
+fs.writeFileSync(script, 'const foo = 1;', 'utf-8');
+
+const env = {
+  ...process.env,
+  NODE_DEBUG_NATIVE: 'COMPILE_CACHE',
+  NODE_COMPILE_CACHE: dir,
+};
+
+function getCacheFile() {
+  const subdirs = fs.readdirSync(dir);
+  assert.strictEqual(subdirs.length, 1);
+  const entries = fs.readdirSync(path.join(dir, subdirs[0]));
+  assert.strictEqual(entries.length, 1);
+  return path.join(dir, subdirs[0], entries[0]);
+}
+
+// Runs the script and expects the corrupted cache to be discarded
+// with the given debug message and then regenerated.
+function expectRecovery(mismatchRE) {
+  spawnSyncAndAssert(
+    process.execPath,
+    [script],
+    { env, cwd: tmpdir.path },
+    {
+      stderr(output) {
+        console.log(output);  // Logging for debugging.
+        assert.match(output, mismatchRE);
+        assert.match(output, /writing cache for .*script\.js.*success/);
+        return true;
+      }
+    });
+}
+
+// Warm the cache.
+spawnSyncAndAssert(
+  process.execPath,
+  [script],
+  { env, cwd: tmpdir.path },
+  {
+    stderr(output) {
+      console.log(output);  // Logging for debugging.
+      assert.match(output, /writing cache for .*script\.js.*success/);
+      return true;
+    }
+  });
+const cacheFile = getCacheFile();
+assert(fs.readFileSync(cacheFile).length > kHeaderSize);
+
+{
+  // Corrupt the magic number.
+  const data = fs.readFileSync(cacheFile);
+  for (let i = 0; i < 4; i++) data[i] ^= 0xff;
+  fs.writeFileSync(cacheFile, data);
+  expectRecovery(
+    /reading cache from .* for CommonJS .*script\.js.*magic number mismatch/);
+}
+
+{
+  // Truncate the cache content.
+  const data = fs.readFileSync(cacheFile);
+  fs.writeFileSync(cacheFile, data.subarray(0, data.length - 3));
+  expectRecovery(
+    /reading cache from .* for CommonJS .*script\.js.*cache size mismatch/);
+}
+
+{
+  // Flip a byte in the middle of the cache content.
+  const data = fs.readFileSync(cacheFile);
+  data[kHeaderSize + Math.floor((data.length - kHeaderSize) / 2)] ^= 0xff;
+  fs.writeFileSync(cacheFile, data);
+  expectRecovery(
+    /reading cache from .* for CommonJS .*script\.js.*cache hash mismatch/);
+}
+
+{
+  // Corrupt the uncompressed size field in the headers.
+  const data = fs.readFileSync(cacheFile);
+  writeU32(data, readU32(data, kCacheRawSizeOffset) + 1, kCacheRawSizeOffset);
+  fs.writeFileSync(cacheFile, data);
+  expectRecovery(
+    /reading cache from .* for CommonJS .*script\.js.*uncompressed size mismatch/);
+}
+
+// After the last recovery the cache should be consumed just fine.
+spawnSyncAndAssert(
+  process.execPath,
+  [script],
+  { env, cwd: tmpdir.path },
+  {
+    stderr(output) {
+      console.log(output);  // Logging for debugging.
+      assert.match(output, /cache for .*script\.js was accepted/);
+      return true;
+    }
+  });

From f427fb358c8fc9568ab1daa4314f130804ccdecc Mon Sep 17 00:00:00 2001
From: Yagiz Nizipli <yagiz@nizipli.com>
Date: Thu, 11 Jun 2026 18:37:51 -0400
Subject: [PATCH 2/3] src: reuse zstd contexts in compile cache

Creating and freeing a zstd context for every cache file costs more
than the (de)compression itself for small caches. Lazily create one
decompression context on the handler and reuse it across reads, and
share one compression context across all entries in Persist().

Co-authored-by: Grok <grok@x.ai>
Signed-off-by: Yagiz Nizipli <yagiz@nizipli.com>
---
 src/compile_cache.cc | 56 ++++++++++++++++++++++++++++++--------------
 src/compile_cache.h  |  6 +++++
 2 files changed, 45 insertions(+), 17 deletions(-)

diff --git a/src/compile_cache.cc b/src/compile_cache.cc
index 38615900ec3d56..9e11793aa3388f 100644
--- a/src/compile_cache.cc
+++ b/src/compile_cache.cc
@@ -202,9 +202,8 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
   // and zstd-compressed when cache_size < raw_size (see
   // CompileCacheHandler::Persist()). Anything else is invalid.
   if (cache_size > raw_size) {
-    Debug("invalid cache size %d > uncompressed size %d\n",
-          cache_size,
-          raw_size);
+    Debug(
+        "invalid cache size %d > uncompressed size %d\n", cache_size, raw_size);
     return;
   }
 
@@ -260,13 +259,19 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
             content_size);
       return;
     }
+    // Lazily create the decompression context on first use and reuse it
+    // for subsequent reads - recreating its workspace for every file
+    // costs more than the decompression itself for small caches.
+    if (zstd_dctx_ == nullptr && (zstd_dctx_ = ZSTD_createDCtx()) == nullptr) {
+      Debug("failed to create zstd context\n");
+      return;
+    }
     // Decompress directly into the buffer handed to V8.
     std::unique_ptr<uint8_t[]> raw_data(new uint8_t[raw_size]);
-    size_t decompressed_size =
-        ZSTD_decompress(raw_data.get(), raw_size, disk_data.get(), cache_size);
+    size_t decompressed_size = ZSTD_decompressDCtx(
+        zstd_dctx_, raw_data.get(), raw_size, disk_data.get(), cache_size);
     if (ZSTD_isError(decompressed_size)) {
-      Debug("decompression failed: %s\n",
-            ZSTD_getErrorName(decompressed_size));
+      Debug("decompression failed: %s\n", ZSTD_getErrorName(decompressed_size));
       return;
     }
     if (decompressed_size != raw_size) {
@@ -276,9 +281,7 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
       return;
     }
     entry->cache.reset(new ScriptCompiler::CachedData(
-        raw_data.release(),
-        raw_size,
-        ScriptCompiler::CachedData::BufferOwned));
+        raw_data.release(), raw_size, ScriptCompiler::CachedData::BufferOwned));
   }
   Debug(" success, size=%d\n", raw_size);
 }
@@ -459,6 +462,16 @@ void CompileCacheHandler::Persist() {
   // finished. In that case, the off-thread writes should finish long
   // before any attempt of flushing is made so the method would then only
   // incur a negligible overhead from thread synchronization.
+
+  // The compression context is created lazily when there is anything to
+  // compress and reused for all the entries in this invocation.
+  ZSTD_CCtx* cctx = nullptr;
+  auto cleanup_cctx = OnScopeLeave([&cctx]() {
+    if (cctx != nullptr) {
+      ZSTD_freeCCtx(cctx);
+    }
+  });
+
   for (auto& pair : compiler_cache_store_) {
     auto* entry = pair.second.get();
     const char* type_name = entry->type_name();
@@ -495,15 +508,18 @@ void CompileCacheHandler::Persist() {
     // shutdown and should add as little overhead as possible. If the data
     // is not compressible, store it uncompressed, which is indicated by
     // the cache size being equal to the uncompressed size in the headers.
-    size_t compressed_bound = ZSTD_compressBound(raw_size);
-    std::unique_ptr<uint8_t[]> compressed(new uint8_t[compressed_bound]);
-    size_t compressed_size = ZSTD_compress(
-        compressed.get(), compressed_bound, raw_ptr, raw_size, 1);
     char* cache_ptr = raw_ptr;
     uint32_t cache_size = raw_size;
-    if (!ZSTD_isError(compressed_size) && compressed_size < raw_size) {
-      cache_ptr = reinterpret_cast<char*>(compressed.get());
-      cache_size = static_cast<uint32_t>(compressed_size);
+    std::unique_ptr<uint8_t[]> compressed;
+    if (cctx != nullptr || (cctx = ZSTD_createCCtx()) != nullptr) {
+      size_t compressed_bound = ZSTD_compressBound(raw_size);
+      compressed.reset(new uint8_t[compressed_bound]);
+      size_t compressed_size = ZSTD_compressCCtx(
+          cctx, compressed.get(), compressed_bound, raw_ptr, raw_size, 1);
+      if (!ZSTD_isError(compressed_size) && compressed_size < raw_size) {
+        cache_ptr = reinterpret_cast<char*>(compressed.get());
+        cache_size = static_cast<uint32_t>(compressed_size);
+      }
     }
     Debug("[compile cache] compressed cache for %s %s: %d -> %d bytes\n",
           type_name,
@@ -621,6 +637,12 @@ CompileCacheHandler::CompileCacheHandler(Environment* env)
       is_debug_(
           env->enabled_debug_list()->enabled(DebugCategory::COMPILE_CACHE)) {}
 
+CompileCacheHandler::~CompileCacheHandler() {
+  if (zstd_dctx_ != nullptr) {
+    ZSTD_freeDCtx(zstd_dctx_);
+  }
+}
+
 // Directory structure:
 // - Compile cache directory (from NODE_COMPILE_CACHE)
 //   - $NODE_VERSION-$ARCH-$CACHE_DATA_VERSION_TAG-$UID
diff --git a/src/compile_cache.h b/src/compile_cache.h
index 7ecd6d0910197e..78501dff693d39 100644
--- a/src/compile_cache.h
+++ b/src/compile_cache.h
@@ -10,6 +10,8 @@
 #include <unordered_map>
 #include "v8.h"
 
+struct ZSTD_DCtx_s;
+
 namespace node {
 class Environment;
 
@@ -67,6 +69,7 @@ enum class EnableOption : uint8_t { DEFAULT, PORTABLE };
 class CompileCacheHandler {
  public:
   explicit CompileCacheHandler(Environment* env);
+  ~CompileCacheHandler();
   CompileCacheEnableResult Enable(Environment* env,
                                   const std::string& dir,
                                   EnableOption option = EnableOption::DEFAULT);
@@ -113,6 +116,9 @@ class CompileCacheHandler {
   EnableOption portable_ = EnableOption::DEFAULT;
   std::unordered_map<uint32_t, std::unique_ptr<CompileCacheEntry>>
       compiler_cache_store_;
+  // Lazily created zstd decompression context, reused across cache reads
+  // to avoid recreating its workspace for every file.
+  ZSTD_DCtx_s* zstd_dctx_ = nullptr;
 };
 }  // namespace node
 

From a6273b1f4a46d5c8150978a342b25e02150f516a Mon Sep 17 00:00:00 2001
From: Daniel Lemire <daniel@lemire.me>
Date: Thu, 11 Jun 2026 20:17:56 -0400
Subject: [PATCH 3/3] src: embed zstd dictionary for further compile cache size
 wins

Builds on the zstd compression in #63861 by embedding a small zstd
dictionary trained on a diverse corpus of real modules, so each
small/medium compile-cache entry compresses better. Per entry we keep
the smaller of the plain and dictionary-assisted frame, so the
dictionary only ever helps.

- Add src/compile_cache_zstd.dict (16 KiB). It is trained on V8 code
  caches harvested (via vm.compileFunction, the same shape the CJS
  loader produces) from a diverse corpus: bundled npm packages, lib/,
  tools/ and a few deps.
- Add tools/generate_compile_cache_dict.py and a node.gyp action that
  generates compile_cache_zstd_dict.h into SHARED_INTERMEDIATE_DIR at
  build time; no generated header is checked in. libnode include_dirs
  updated to pick it up.
- Prepare the CDict/DDict once per process (shared across all handlers
  and Workers, matching the lazy-context approach from #63861) and use
  them in Persist() and ReadCacheFile(). Persist() compresses the plain
  and dict frames into separate buffers and selects the smaller, so the
  written bytes and recorded size always agree. The dictionary is only
  tried for entries up to 256 KiB; larger blobs never benefit, so the
  second compression is skipped to avoid wasted work. Falls back to
  plain zstd if dictionary preparation fails.
- The dictionary is embedded in the binary because the compile cache
  must be usable early, portably, and without extra filesystem state.
- No on-disk format change: dict-assisted frames carry the dictID, plain
  frames carry none, and a single DDict decompresses both.
- Size, measured on data held out from training (per-entry min policy):
  the compression ratio for diverse modules goes from ~1.87x (plain
  zstd) to ~2.44x with the dictionary (~24% smaller on disk); on
  test/parallel, which is not in the training corpus at all, it goes
  from ~1.74x to ~2.22x (~22% smaller). The cache from a real
  end-to-end run (npm --version, ~70 modules) is ~15% smaller. Read
  time is unchanged and the extra write-time work is negligible.
- Add a multi-module write/read roundtrip test and a startup benchmark
  (standard createBenchmark harness).
---
 benchmark/misc/compile-cache-timing.js      |  72 ++++++++++++++++++
 node.gyp                                    |  17 +++++
 src/compile_cache.cc                        |  72 +++++++++++++++++-
 src/compile_cache_zstd.dict                 | Bin 0 -> 16384 bytes
 test/parallel/test-compile-cache-success.js |  80 ++++++++++++++++++++
 tools/generate_compile_cache_dict.py        |  37 +++++++++
 6 files changed, 274 insertions(+), 4 deletions(-)
 create mode 100644 benchmark/misc/compile-cache-timing.js
 create mode 100644 src/compile_cache_zstd.dict
 create mode 100644 tools/generate_compile_cache_dict.py

diff --git a/benchmark/misc/compile-cache-timing.js b/benchmark/misc/compile-cache-timing.js
new file mode 100644
index 00000000000000..bdeae8c5cd2e93
--- /dev/null
+++ b/benchmark/misc/compile-cache-timing.js
@@ -0,0 +1,88 @@
+'use strict';
+
+// Startup benchmark for the compile cache (including the zstd dictionary).
+// Compares no-cache / cold-cache / warm-cache for two workloads:
+//   big  - one large module (the typescript.js fixture)
+//   many - many small modules (generated here, side-effect-free)
+// The modules are generated into a temp dir so the benchmark is self-contained
+// and reproducible, and never executes unrelated code.
+
+const common = require('../common.js');
+const { spawnSync } = require('child_process');
+const fs = require('fs');
+const os = require('os');
+const path = require('path');
+
+const bench = common.createBenchmark(main, {
+  workload: ['big', 'many'],
+  cache: ['none', 'cold', 'warm'],
+  n: [30],
+});
+
+const BIG = path.resolve(__dirname, '../../test/fixtures/snapshot/typescript.js');
+
+// Generate `count` small, side-effect-free modules in `dir` (created if
+// needed) and return the require() code that loads them all in one child.
+function makeManyModules(dir, count) {
+  fs.mkdirSync(dir, { recursive: true });
+  const reqs = [];
+  for (let i = 0; i < count; i++) {
+    const file = path.join(dir, `mod-${i}.js`);
+    fs.writeFileSync(
+      file,
+      `'use strict';\n` +
+      `module.exports = function value${i}(a, b) {\n` +
+      `  const sum = a + b + ${i};\n` +
+      `  return { id: ${i}, sum, label: 'module-${i}' };\n` +
+      `};\n`);
+    reqs.push(`require(${JSON.stringify(file)});`);
+  }
+  return reqs.join('');
+}
+
+// Run `cmd` with `args` in a child process and wait for it to exit. If
+// `cacheDir` is set it is passed to the child as NODE_COMPILE_CACHE;
+// otherwise any inherited NODE_COMPILE_CACHE is removed from its environment.
+// Throws when the child cannot be spawned or does not exit with status 0, so
+// that a broken child is never timed as if it were a successful startup.
+function run(cmd, args, cacheDir) {
+  const env = { ...process.env };
+  if (cacheDir) env.NODE_COMPILE_CACHE = cacheDir;
+  else delete env.NODE_COMPILE_CACHE;
+  const child = spawnSync(cmd, args, { env, stdio: 'ignore' });
+  if (child.error) throw child.error;
+  if (child.status !== 0) {
+    throw new Error(
+      `${cmd} exited with status ${child.status}, signal ${child.signal}`);
+  }
+}
+
+// Benchmark entry point: times `n` sequential child startups for the selected
+// workload. 'none' runs without a cache directory, 'warm' populates the cache
+// once before timing starts, and 'cold' removes the cache directory before
+// every timed run (so that removal is part of the measured time).
+function main({ n, workload, cache }) {
+  const cmd = process.execPath || process.argv[0];
+  const tmp = fs.mkdtempSync(path.join(os.tmpdir(), 'cc-bench-'));
+
+  try {
+    // Everything that writes below `tmp` happens inside the try block so the
+    // directory is removed even if generating the modules throws.
+    const args = workload === 'big' ?
+      [BIG] :
+      ['-e', makeManyModules(path.join(tmp, 'mods'), 120)];
+    const cacheDir = cache === 'none' ? null : path.join(tmp, 'cache');
+
+    if (cache === 'warm') run(cmd, args, cacheDir);  // populate once
+    bench.start();
+    for (let i = 0; i < n; i++) {
+      if (cache === 'cold' && cacheDir) {
+        fs.rmSync(cacheDir, { recursive: true, force: true });
+      }
+      run(cmd, args, cacheDir);
+    }
+    bench.end(n);
+  } finally {
+    fs.rmSync(tmp, { recursive: true, force: true });
+  }
+}
diff --git a/node.gyp b/node.gyp
index d2dbce19992b10..ab54cc27437e72 100644
--- a/node.gyp
+++ b/node.gyp
@@ -1110,6 +1110,22 @@
             '<@(linked_module_files)',
           ],
         },
+        {
+          'action_name': 'generate_compile_cache_zstd_dict',
+          'inputs': [
+            'src/compile_cache_zstd.dict',
+            'tools/generate_compile_cache_dict.py',
+          ],
+          'outputs': [
+            '<(SHARED_INTERMEDIATE_DIR)/compile_cache_zstd_dict.h',
+          ],
+          'action': [
+            '<(python)',
+            'tools/generate_compile_cache_dict.py',
+            'src/compile_cache_zstd.dict',
+            '<@(_outputs)',
+          ],
+        },
       ],
     }, # node_base
     {
@@ -1123,6 +1139,7 @@
         'src',
         'deps/v8/include',
         'deps/uv/include',
+        '<(SHARED_INTERMEDIATE_DIR)',  # for compile_cache_zstd_dict.h etc.
       ],
 
       'dependencies': [
diff --git a/src/compile_cache.cc b/src/compile_cache.cc
index 9e11793aa3388f..35c4b02cc70d9a 100644
--- a/src/compile_cache.cc
+++ b/src/compile_cache.cc
@@ -11,6 +11,10 @@
 #include "util.h"
 #include "zlib.h"
 #include "zstd.h"
+// kCompileCacheZstdDict + kCompileCacheZstdDictSize come from the header
+// generated at build time by the GYP action (from src/compile_cache_zstd.dict).
+// The include directory (SHARED_INTERMEDIATE_DIR) is added by node.gyp.
+#include "compile_cache_zstd_dict.h"
 
 #ifdef NODE_IMPLEMENTS_POSIX_CREDENTIALS
 #include <unistd.h>  // getuid
@@ -28,6 +32,29 @@ using v8::ScriptCompiler;
 using v8::String;
 
 namespace {
+// The embedded zstd dictionary is immutable, so the prepared CDict/DDict are
+// created once (function-local statics: thread-safe init) and shared by all
+// handlers across Environments/Workers; zstd treats them as read-only. They
+// are not freed here and live for the process lifetime. Returns nullptr if
+// preparation fails; callers then fall back to plain (dictionary-less) zstd.
+ZSTD_CDict* GetCompileCacheCDict() {
+  static ZSTD_CDict* cdict =
+      ZSTD_createCDict(kCompileCacheZstdDict, kCompileCacheZstdDictSize, 1);
+  return cdict;
+}
+
+ZSTD_DDict* GetCompileCacheDDict() {
+  static ZSTD_DDict* ddict =
+      ZSTD_createDDict(kCompileCacheZstdDict, kCompileCacheZstdDictSize);
+  return ddict;
+}
+
+// The dictionary only helps small/medium caches; for larger inputs zstd's own
+// adaptive model dominates and the dictionary never wins, so we skip the
+// (otherwise wasted) second compression above this raw size. Decompression is
+// unaffected: a single DDict decodes both dict-assisted and plain frames.
+constexpr uint32_t kCompileCacheDictMaxRawSize = 256 * 1024;
+
 std::string Uint32ToHex(uint32_t crc) {
   std::string str;
   str.reserve(8);
@@ -266,10 +293,20 @@ void CompileCacheHandler::ReadCacheFile(CompileCacheEntry* entry) {
       Debug("failed to create zstd context\n");
       return;
     }
-    // Decompress directly into the buffer handed to V8.
+    // Decompress directly into the buffer handed to V8. The embedded
+    // dictionary is referenced via a shared, prepared DDict; plain frames
+    // (which carry no dictID) decompress correctly with it as well.
     std::unique_ptr<uint8_t[]> raw_data(new uint8_t[raw_size]);
-    size_t decompressed_size = ZSTD_decompressDCtx(
-        zstd_dctx_, raw_data.get(), raw_size, disk_data.get(), cache_size);
+    ZSTD_DDict* ddict = GetCompileCacheDDict();
+    size_t decompressed_size;
+    if (ddict != nullptr) {
+      decompressed_size = ZSTD_decompress_usingDDict(
+          zstd_dctx_, raw_data.get(), raw_size, disk_data.get(), cache_size,
+          ddict);
+    } else {
+      decompressed_size = ZSTD_decompressDCtx(
+          zstd_dctx_, raw_data.get(), raw_size, disk_data.get(), cache_size);
+    }
     if (ZSTD_isError(decompressed_size)) {
       Debug("decompression failed: %s\n", ZSTD_getErrorName(decompressed_size));
       return;
@@ -508,16 +545,43 @@ void CompileCacheHandler::Persist() {
     // shutdown and should add as little overhead as possible. If the data
     // is not compressible, store it uncompressed, which is indicated by
     // the cache size being equal to the uncompressed size in the headers.
+    //
+    // We also try the embedded trained dictionary and keep whichever frame is
+    // smaller (still subject to the "only store if < raw" policy). The
+    // dictionary mainly helps the small/medium caches that dominate real
+    // compile cache usage; for inputs where plain zstd already wins we keep
+    // the plain frame.
     char* cache_ptr = raw_ptr;
     uint32_t cache_size = raw_size;
     std::unique_ptr<uint8_t[]> compressed;
+    std::unique_ptr<uint8_t[]> compressed_dict;
     if (cctx != nullptr || (cctx = ZSTD_createCCtx()) != nullptr) {
       size_t compressed_bound = ZSTD_compressBound(raw_size);
       compressed.reset(new uint8_t[compressed_bound]);
       size_t compressed_size = ZSTD_compressCCtx(
           cctx, compressed.get(), compressed_bound, raw_ptr, raw_size, 1);
+      char* best_ptr = reinterpret_cast<char*>(compressed.get());
+      // Only attempt the dictionary for small/medium entries (see
+      // kCompileCacheDictMaxRawSize); for large blobs it never wins and the
+      // extra compression would be wasted work.
+      ZSTD_CDict* cdict = raw_size <= kCompileCacheDictMaxRawSize
+                              ? GetCompileCacheCDict()
+                              : nullptr;
+      if (cdict != nullptr) {
+        // Compress into a separate buffer so the selected frame's bytes and
+        // size always stay in sync (the plain buffer is left untouched).
+        compressed_dict.reset(new uint8_t[compressed_bound]);
+        size_t dict_size = ZSTD_compress_usingCDict(
+            cctx, compressed_dict.get(), compressed_bound, raw_ptr, raw_size,
+            cdict);
+        if (!ZSTD_isError(dict_size) &&
+            (ZSTD_isError(compressed_size) || dict_size < compressed_size)) {
+          compressed_size = dict_size;
+          best_ptr = reinterpret_cast<char*>(compressed_dict.get());
+        }
+      }
       if (!ZSTD_isError(compressed_size) && compressed_size < raw_size) {
-        cache_ptr = reinterpret_cast<char*>(compressed.get());
+        cache_ptr = best_ptr;
         cache_size = static_cast<uint32_t>(compressed_size);
       }
     }
diff --git a/src/compile_cache_zstd.dict b/src/compile_cache_zstd.dict
new file mode 100644
index 0000000000000000000000000000000000000000..b64455d45b1d82ca5b0c2a4dc0c41a6c1220fc68
GIT binary patch
literal 16384
zcmcJ04}4VBmH&H_mzg06;Xx1rL=1li6hahKWKr{GG9d#=$OIyw?&eJ<kI9h9Oq`hz
z!pGKtC|axy|APJFu2t05wtm#rT3g+sTid!-M0ah~Z7o{=*Q&KB()L$=-|xNeO(p@`
z?PouG^O^VFz4x4R?>+b2bI(2J=E8&3?>+R|?Q_Dq9*UgrzHVaalQ;fwN?&Vh?|E<U
zcWr#VedESk?%DorZ_h1l^{eYvuG{`<)9lg{Ri)ql!|^|V{_UL)dam2q|8~(M?Q{P5
z<-M<+n||z1Cx7y%SN?Rx<@49v;nqt^ih}<8m+YCdSkcVdJr!qtZSd*q|Ij?uH{+)5
zHyQ3J(UKX;cvYD&I8{-Uj-Ql%@vi@LEqpF|ON;m19VO5F^d^+5_-Xig@k@5ZlQBgt
zX^u?#@_kc0C`t8X<Edmulx@BJ>fMDX%l7wJ8N3PCbesAl;d;`ksFjg$)9?A<EmGTT
zr87h(-1~E)Uy$^yWG0hP)bi$zd%Lf>W;)>F$*h%5MiPr`B6wSE))p(;%eK)DU|Y<W
zU*;H4)e}iujgfeAZD-nwbOeXtP_3vFo1+)3OMK%De0N9EUH()mo5`jlJ%LnrPr}Mt
zgwdPZ|D&t4L&tZnZF`_vtyb?DuX`>o^1R{l{Hmn%VMQ?kr<_F6CaUW_M+J>46cv^?
zD}@tl@T(qUZY!KLpt!uFe}_&}CSV3!lYpb}uK<6l;u3ESZ+`Q~C;yx;r__b{k~Pj#
zLKL8!Uz(`L`^EM`#f^@-l$r?yRg_sv@IWdqV)~Z*l|wC$ojmZSu2e=kZn>l0|6ljL
zT_Pd)RA+|^20cGA`Ta8UUeAninl__gx#uCZo23!_T$)??sye7nSUPp>gbM%NYVp80
ze4F_GSGD+vd&1JHr_0Lp2^BM!&-{nUN7bSwWtBzC%jSvSm1XZuC{-pX#Rt{WC6gB8
z<8@W!@3ZscZm3~HNHaXwjh|7_<N1ziGD~StP0z(@$Ll?64NI6PpG=gs{DdKjdB5b-
zThAMZing{Wq$g|n<F?F0ZvOJp#lZ=pE@NdIQyskttJc~W=}lxMCCc&T8<wo3Y`4cD
zvE7s=CR04|P?xV0-(&GzPWH{V*~flK_L(yZO29sHPOLeyuk6raRSvJj8J=90?S$f|
zlXl?)A~`IRY9(0^sCEE8`+a1Jq6AIWQ<l{d&r#6_Qm2qGX*Fn&1ujL=MemejGenJ2
zK3J|T5ko5RJfjB9*T-N+AS))T#p0N!P2Af~DMmX=4YW=H-p6h90m+VeHajR}k{vr{
z6zE`w7$`_8uAjz>lu7d@&%-y9WQ*>w1sxN5=dQX*cTsC4Q(`%ax&62Mzwmky$};g-
zGLr303nhho6u%KnEL{dNc&IKe@4PXn3xqsfb=3fiPnXW+%pwKx))tuj<lt-6*+U&O
zl^SHJfxds~sz)c{dv*IJE1F$nWt-EfY>Ikw^+ps6n8Ow62w_mw9nV-fh_#&-bRM-!
zWGiV+_ivh&2e&Ss?QF3!sRXqv;RrMH%s>3F4BstQEV!j7M~b?UAVPz>i+}Tjic?|M
z^mn(X5-nCwA`%tiOnQ^XpE-wZuF0mcA>`<-=}E-14!!BoU=`QkD44aWhE$)G4n#8c
z;_y5*mJ0WQ$u~|e2Dr2C5-Bm|qWfq6qGHD6k#%+8N?kl*HAk|YV8ynRr18p*hil3I
zn3b)KWFwNh$g}SHxmO+G<aaejwlrAD7|=vwUHenVpJ3Z-tu5JFE1K%C(y|T<`sK?*
z$0(?+Ee$#N^Uk>WDQ*tjK-Q)s$;?J84Sisd*5>}yHDcq)7|DJkosRVTdpDw<Z1b=A
z?l;E+FP_P(xGZk<3CcQlil<#g1Bz>I$pS7h{y~bCo}#5M*&q;XEj_HKUz{|or|0Eq
zI4YV>du4qIs5w178!IbDTIb_OMRT{>IhES>CRMx!<?A-rRAth`>eThqex$mU;v?Rz
zO7RVMt3}Hv*8oqhz#3--mZC`Qk?TZdy-3t=OkBeG30)TJ_3~X$e99iDt*d(DX-nD;
zGvB&~tWR1(s1(mXj-iUZ{+5S-!KIDeKS5ID>=TduWh(_Tl-wLi#5;_1thd`rW`pT;
zN=zkTnr?XXJ}!blDw)KpTO04TQoX|<qRE$cw|$FEW)ouV2+1jZ;H7TrqcyN!U~dE>
z(N4J#Xrcsu^elzEJJR27HKo$sXnm_?w~%XHQG~Fq1t8PoColaUy^q>(e|wFaq(|0L
z0%s0Q+Dl1Krjo0B)?_1T$vwqHnKBbUwX%8R+@i@l&%t+JI-ZTRCoHT|E7IKvfv$_E
zGud@0wpuV3Rwf%t)+OSxPD#ZCj$+`qL-75APbO@jDJ3^cTU7-ji9~xO+J$lxKZQ$|
z9b0xm*EPA0i56IE1I@yRI=eY`iR;W5rEz4(?0r@srGv=~ly?h^yMDXH7K?h+>Trmy
z#s@lB(QGxnd&T0}pG6Myluf4+38<q)O6nsMu*&85Z5Lg>{E6SWIQO-y8-rV-mN0e+
zVe&ycfr9l<n-7&!_@F(~k!ZFa%vuN2Ax&-)&g5enem4m4%|Cu;TORlt2#k@4rNHsd
zZbF)TP!kV`E_{C3<OkV>u3&dhwm+xS2-X)1#f<(~zzBqlkP(g<>#|pc!mTl5jbTKp
zgMmmqxWec%YQq7;-w-wc<M;PwTa8G(+AxCACZpdl!r_%GYQw>p5e)hPFX^=MJLGTa
zt2P4tMs3JwJ<o_4jeUKghLF*iGGgIQBLKQFW3kbP8qf(Dm-~%%skqT%^oC;oI)Bjb
zU(y%sG-CZ%8L>>vsIEWPSi2!m54?~OJkRI^Ht?Eap~i670NmDq5zG27GJq2|{2`-d
zMQt>Qk+D6L1dL$Fs7s@db-<4qE3#~_(;r)D7}bDSgE0j#p7u?b87op*!|>PFhQS|<
zt0h(qdVT?K(~*5`1rH4Lt>36aKaASOP=MnNZwLlg_XSh`v#}aYMqi)A3mfE9gBVX7
zbeQk#BYi*Uw}y-+|M@LTQ3j~$V2ER{ZCDxzRM%f-tO*8cSG7ty8yg89Mf)-GtWNNZ
zw72+;0N@&`frGgU8v)F1?J6U*Botd&R~sg$Vu3Kkg%ZZ(g?ieC9r6jcG%0C(F?r8|
z5qw5*gx|Ierg(icEBxP*kdB4r#aTu(Gy%z_#N<62*tbe-?r2P2tn;0Uc4mQq<Tk+M
zMMrijo^!{-pj5}1q6iPa_!<MKZHni2MFM3mE0MelL^r-HyTKD6lNW7!#_9r6l|_md
zABE+wb*pO00h49iX8hu73^sHsod^E%%T_9#ZmT=hXk|N79mpU#7_74~ux*1+ifp!A
zK%rT*uRSTpbf!}_i(MHTVHRu@$vcNb(e9U!T<uKW8KSgXmh$kx<OOl=WX}hm{}&DU
z9xE-)K6?}eD6{(nrH%pKBm0Eu5y`udrMJ(|4I5*15HK6id>Htf$>KpyLNt<y_9mc@
zI-qHyiQW#Fy(Y<^Yt(Y+$2~RXoiy>g*2<H+iEjmyAn4rdExCg9dpBc0>yGrSuy<n<
zWlBAM*UKGvW7m(l69~&DXAy>y9o80M)0(Ig(=#Bb{>K9syhf_gL?n}uW+?$=&(6UI
zsG?`D4EmEa3mReO!Elq+WTR*P7!xl=<qxBMt;$<WEh(B0N&AZRCLc7T1WP_0U&CE8
zo>_-uU8+y+@iq{}9esm7|LDg<Eo?*T+E6CAB@3rS9J?e6kxV|gj$n|8@AL3Y#6KRM
z{Vwbo&~LWVFxqJ@&@N2amVf}}Nepa<@$kw6H&&Aj%vD(BVgqvwmwXFVwif^(+bHV4
zeu$kL$>)`+coKz3CLf$k4!9_)4UsEdp-dC{kuyk4lqr-ZcBAy<m|su9flpuEUVtJl
z2=u5jlj==Ni(gUp4Z#>!6;9Yso>Rr)`QkQYkmQkXFlhc3l6(;B&txgjJPtu}oCJGP
z>8!(Xn;_dFK`-8yj3)R9h+TroH&H21kXfLquyd$!ehxHJzH~I236!6JpovO}Ru43u
zJ86gf0%&ZtCLhf?b#i>tHlCyAox&-AuA>c;lxg#%vFo{Ue3V_L@HuIU>-o~<t`j&n
zJ}in%J_Q^8=9%#T$AR>9yg6&%UwVf)stBVbxEXe=tT*{0$r^RRZu>MTYn&$qohfTm
z3}N!MCEEE?eK>aKtFSAziKc+WL!9&-Odg+@v>jr`QH!%f$)2Ej7=!%?Ka;g$T(-Q}
z2d>IQJcDII|DdAm9TeD9Kb&6bIE`|TB;^GJU1)M4ekMyvP^-1kD6yPg%)e4N8f^(s
z?jM0x12pL#lV}uv_h__7fb!`Gv@2~ic8;xamOZ1<iVNUQ!Oujc?4)U<(fA`8<-j`{
z?GR8d24NGG60KpcwxyjC!$CQ+J7zTA3gG<r2)yRKy9F8tMKsE8k&RZ9=WclqST_PF
zf_l*+-%Q$q-9q>|O+O#+Qpnum5$)~`nzsP+7-Z%Y?0piM3xmicQeq<us>my=j;IPZ
z>DQ<Rk?a}Pt~6h$!U|rL$A<j}cDHMS1rqHnfd6I`T8H@tP<Emflhh~~L!;0tQU1D(
zR%0R~m$cA$-ED>JWhYJtR=R3arV3jY@-<gT*A=I$Mwh;)w`>xg8AUxyQBF^*lfI<5
zDn2dNd<DgYK3B2(9`_X2RQD`Zd3Nz9F4vJM1&61&p6NXP$;ZdE=MT;-D>zbo;_Bn>
zyGo`M99eu^^Zw&d$>I}*MR&LtpKzBPoVe3dI{(Nnui{#EykOk4<0p!bOG;zLADLG0
z@ih0bX(#?*9sfitD}C5x2gGW)TAk=Q8s(OXRj0V&M;<c~{^SOC(STism!jP!7z)~A
zSdeh#XZEnP7qtrQLv6gO1yyZ|icx9<YPn~M3W1V)BHtv=M8?3S9nc<9$;Zon9o|GG
zlEk*LtcOk(nZ*8Ry5~(mwrWu#l8#vmlfB*Ta5jP2HqfxYaETCJ(VFcq+-4h5<$KGu
z%Hhe|reK1&ikXTbQT)2rhJ{V~tZLCBbLaZ2C||+>?}YAim8nO%wByQii$8U_e6C&a
zm0wh-Y5A<2sFv)Ha0PL&+Qdphd?@Eufx|=8Y`2?}&hMP}dwapKSLM*KgecUE%Wbd9
zxg_p*zbC@05=DWq!Rb{AEFE@k_e?%2OiSrCndf*-$bPlj_L>|bG82^rlQT&&2m1lt
z;4HoJxVMrT!OBD<Jy!kN#s&#t^7UU(^Fi@Nd6KN=Iu#mS`e>1R0*uZ9ad!P}fpf}G
z5ltoGLd*s_BgvSRS({pK6GxDv!DEf{D!~Y#MkFq=Vaal;Zb$Fcij}4iv02F!jKeMc
z?EQo*68+RHvqXszb2d8GwQoCr0p)KNEC*3-Q)3UO9`M{p`J0uME*#t4B4R-VBh2SN
zH}D;<omm|?F(#WW;l;Nd8WdBHQRHbY@>oTih~eyvf9w5}?U5P%cJQ9F>-h$sDn0YZ
znWWFX1)-tc;~<4l)JT{>k=ECnd@llzJpKBL;Y_byCo-3^=5x9yR4TIX0vH?i!f}H6
z+fm810rR>;@kCr#s15rgj2SWI+Hj6dVyvhjmgm+I6EEc)WQLDsMDf$`cD;0yFuWlJ
zbe74T!NKPcI7yq&o7+}|??^|7&01ub=feSJUkIGM=I{w_KGIdRCKc_H2MGa81g5uO
zG7QVCuuNFY4s-o7Y4wmY7C>-qoicBxs9_Ak5pGrYyrG&Ljxf|)OH_To$WpXDzbbUH
zlp|<HwPbaKz#Lf>L=G>-yd1fm_?gUc4dI~57zUfCY;qq#CzL9udC~Yjhcp`=ax!f8
zfRkaPgQsosO*B^qj+uZEP43<^vORWkk<*^GT#k2N(EJ_Pa}slrL)5DGfK%)sT}ceL
za3aoeP#r!6%?d2Rt(cf$%q4sFk3b~n7ubll%`p@-ZwAhrn66>Gr8XYN$_A;^7TS0N
zN{s-dxCmWOgPe+xfaLnwHlTK&_C4*8r?rH$GGgAV+egp)*F!)=D&JkM&C5-F(0mhk
z9j?5tQ6rpvviEIj1k7$D0tcCFDrwONoXJMIX(4D6_lZ$cMY2-`cpr2c5bVOBuLIQ=
zM^k<|@w4qb_JJ}9u1?2eh&~UKKCn;poW_nb+B<E+qnN@0k`lqtigJeyrgdsruAxn<
zwx?-$I#KCdbP{#nUGP<l+LX=&I--+N3pr3k-TPmde%%;+V>M&A$=oqaD~E|tSy(=E
zfvV1PECXkukpWDcMgiivP3sxbt{yrtC^qCI4Z-{k`DR6{_yilW?kmuJ+Aa*iSGWs7
zwC8pez-F4IDTm7npXvJenCtN3kKNici;sESKG))7UazlU@yBC|eA?oVi%Oo~SzJ2*
znc@@6junk7{&d-~lJUjImmM2hR($ND!qPLu;mSn2_JSO*ACN~=3ODUzI^(~54(q{1
zlh2&QNtQ~(lg!;=gJ}cW4W4adF($97eND|NZHh4h8Bp3@TlqK~`QIt+JJ~qWO=v(H
zt48?kC`+DfVXKWOqqeY>``1;^7<D5N!~<{6cz&w1Gd$~#PFS#o<*yzS#2q{@S{(Mk
zIRo@USR4lzIm_e)inEbmeThW>o9F%#L6P#s<b{Bi%vQ8RqSO&4uV~zHWKpD;ywD$o
z<*MuwzD1(Pa0iMVk0rGOlNU4Tcr3Z0GI?R^gEzJ(l2eU2!(#tv%Avg=qXb)8+Coj2
z84aP@HaL{q)^2DHIxy~cXPuxz7!3pHRswP1EVI7i(ruX4t!vv>*R{16O)G-*n|y!8
zh0ju1#52OLf=El0(ZHzH5butQ2nqu$po8u7pMUU`rDTPS1<JCyzrFBbjw7DT(D@_U
z`{Y2=LtNk@ipA>(sZ_#>Bt_lXXS}|ZeR1mQdXrIJfMGwsviHf?$Ump9Ntonv3^)Jc
zYqj}xG9WAK=Dzco$>WlPw>l{!(4^U3|H5VYcuwd+w5P3~m*3A2uIR)NHD%qKmG4)u
zpK<v0A|1oQCDwhn{P^p#j-i~9bvLhj@I6Qg@aU_O0V!k!&5yqP+e<mSjQIspiIfa&
z%es|ww)@%7L}Y7!YhFFuYf4`52<u{)2PXH#>L~+wYo<89I>)9$6m6z{M#}9YT7`K#
zmg)!tIXE<EBSO7k`{$hY<s&+-Bo0y@2!5G&fq^V@-B9jUCSQpl>-W56hsN09(}~VO
zfJ;zaA`b$_05T(zv+z`VrLITMJ-sC+fsT!|_wzkGIH~BK=hQuBCGaY-pkN*?RNI{;
z`)l`KJZ`0iL_{+Aq`|XCdk>tV;^d0ufcd`09<XCWh>3lB*>#+}wzhaT9es>DBCD7e
zptV-?(qxV_gF^=dMK(@~oYn!G;wfG=amM3LGT+6W<Y5!Qg33_NHl#L{k#bmA?HC$t
zGnb&u#kIwm9PPuJa_!Gza+lbLwmGO*y}9UEcnu;(t+ALN(Xw#3?y69%4iO|obJnzW
z8hu-O5OGO_!i|j)MvM?agO>0|!!1TQ+URHb+CG-Y0{%b{Q8mPP`VpNG5g|mn;*5|5
z!>iUH4i!X{2GKkj;X#C|c0-_6#PI4Em11N}wjrW$L4R#sAEIuet`m{HKto@!4-qzh
z%&6PKC>tU|2BLhT?bU%$ZA-WsZ6Ruw2*-`;)+R)}7)5I_4D^Y854JY>(VuY3W%ac!
zOW7AjzYuLgUu3i?5Z>6e9%bQ>vC?0Mvf3b{O^uD0_hlGyGQttW4_jBn{EQ-kenZ&E
zB9geJHZ1ys2;WLS$AxGg+P0&8T`SfFw{AfEihKzpn$<^oF(bBe5!&8tto8fr>g)V<
z!41JMqIM|D8i7u~(Ym3@Xh~swOZ|;q^$8=mq0tD-Iat*itZRv7E-(V;e>NZDr{zN+
zY#?&jg}&e&GK|%Av5+4l3;OM!^kH(Nqz{u~dhnm{K$0qAchKyB1zQh0-()F;+cD~?
z7hn!nrn+*@P)Z{Sk>H)930(^!ye(s*QWCPgt5SKv8=u9Er3^2q<OoukkRX@cU84zZ
z0<jNIN0804XVO8IK`uv-gh-GZ!rh|@{yz|lBdleja>P)n5lFB-)zNP|aJjTeh@Jn&
zXhK^-<k$#8_E6cpL#Q<)g87aknLQ#w4*8p-30C5OGlXSsqSEeJbL6|ft1E!kL3{~j
zKHhfEI4?94sh;l{P3S=oxpu~Byr4klaRnR@UQo_6_Lj|455CWi;l3%ZXZ0o$2;PvN
zyQO|}?07Pvw+Rm<DL4q0JPTJ-%k=y{!)R&B{PA8IEzV}_he3h+tQp>RAhu1IUMe0C
z$c)W4;TjW}k)|$9N#`69x503@dQ|(Vb_A}$*Wnucvo=Phe{hPb%}}+4!tr<Sibv*A
zMtaim?o_%X9<gu2ctT_3X+fK<&4bN$lP5e@TcA}Vys(s4xX}NV7vFr6tvaWZMOG4b
zsboX|#bP5Lda2`GlBXmGS?yf40z>N_4<F^AhVglQN8TCU{Jn2Bi}?fwnXE0>YB&jZ
zHKp$6B;;^tA+WxdJ#ziJwis6S$l68D{bWGZYYl{Z|H*982snER96Lj6R&Q~RM>9c>
zi6dpA{FBCOug;iNPc4BfLc@27k+)C995qFcz1@Ey9!NqSxHAXMzDgXj=aNa>nMsG~
zXLa9bIPK0%qq6D2=boTeNhM`q&u)kvVnY<XA-kcP(+J2c)H?!llMP3frf;0_7&|Lm
zzlhGl35cAWzCSK~^CC`BRn?+sDs3&wh}(e~MJp%f;cLD#m909pmYhEv3t9X8g5MwI
z8h2{#nNqY$iWFpNK+T=K$RzcsbJ)26IVR^MAaiv8$iyCvPB_$rN{2mVU$rf#DzMlj
ztQW)(%BY9eP2|S{V1=jG&cLYHrqsdjChE>CKyT_jXQ)wPI<4|MKe2baVC}Dru+(l(
zcwf|}WgqN*b&9d<gFU|~{%F|;d*3Mj;G)8PZ`q;3JT(BP;nkj_pL+)c=HTb1$3Oq4
zpFXeYHSk~5C~nkiHay=fD`Xk*M4g1omF3YUjm&w6l#&K_`M|cPz??(MUe#T0vW&F!
zqe?OBP&R;@>CT;W+Fk|t@ostk4RhWy*I*#aH=l%*H`1NA%wb|Ts5x)Ea}~Y&QnC>z
z+!0sNkHCI)uA+D5$pdXs$F7?PtW%xwT;DFuQ(dY|HqTb3eW*>SL`0X)G3N?ng=2$L
z(QttkZ9VJXG4+&KLZQqvcAUvC8lA$YjkkmzGVv+P^;N^)pwj;Qr7i4fyJhtdhLj&I
zSyLu^FXI5`t4`ai2(dx^toxG?-x2BI<p9Uxy8WiaKXBU>*8+Gs)`p^HntsWfZtg21
zuMFV!Ebgcgj4(G3bfqSp0uxHw7e)lko(ipnT5lwsMiF0g=*<1%%Bl&cz%=(}Itd}$
z@-N61Ovd*}I)pKLdJ_Gjt;>Eecq?aYB+Qyb-1cgDZY*NA&puvtkVBJaQ`{1aCwWsE
zKCo;*iUn&fiGKYy>Qf1`%IeRs26Z^Yw?u#b4);@82TXYjyFQXx-IvTGL>6zHKkyaO
zX|XmYa9&?w--8kJ`EL^&eo0llCbAL#d(tDyUNiUI<&@!yw}K6mUG{5l>g@8Ud(pX}
zv0HO*$X(R{Bpa_=z4j?K-nKCTKGh{6F=UXq*NI3^{@V#heAb(hA*Ro&cghdt!39lX
z(8jG1UtBm^IsCM+1wP{HyV5>YZ9#=xea$lpDi8{@P@r&4x^@(}l?$88)|Xv5p`uDT
zYfzouJaftP`l+?kuADTWUU*QQP_ayzmX%AQ+F21Cwz_=uiP%~DT!~Dkcw%dX;`Kb|
z_Ppd4YIvVrycX}gA><v7>1zJC2(Epy`HvfxiM_Y2&C1CC@R0bPcU+!VUD%)O=;`Rz
zy#Vw4$`#n}xo!AV>_i~AuF#6A?=z`QxPOQUgv@gD5<IlcV6NgS7&%cV4uQP68l%Fg
z8KW#Hf%%xkE?WXRChBq~@5}%CjThK2c(#R}fw>6ALGMa)fNXs9GCYt5hAq)^KxQR=
zf?J$k2_dXaqSNR-yjzC;AG6Vg*|NZ%Z_2Wq?-{N<R|lJOefwIqY@V;-EYN2X6N}3;
z9b^|qlS{ZfGfrHdnNlD>{{DZw*kre{3vaE{Bxxb6>Vm<JnMw`wBa$OGO*Y;g&|2E>
zRqcc-IN>Y-zVn1dcpaR{AG<_S)Z(h(G}Zr$k4wYriF{Vc|A_f2TKW-wCb8JJ-P*Y>
zUTAXROz2Yn{e^3VN&mwUm<NL9)4++McR4(5ylYT;y`8z`7*1+icFVX8XM~0wji}N_
zJdm6j7jfTtIJR!a&twgIqFudPlb2|yyNOGR<7`}cYS|w&2Z8h82)qINOoBpz#_d5L
zjrO0Yt;#<oYdf@w2gH%eIm@uw@uTsgz-fb?F;OX{94qwYM;h+p62S_=-R*w+_y8+g
z5_I~{y<>t+u*O7Y_;5rch1HJjTWEvfV8mn5d)l%5gV7uwjBtZWyZEmkkG6^bV)?8i
z43AFS_fI*-RB}tWcm5amO+t@yhZqbExA8NJXd+{`vh8DW*5bj3|AeSDXwBMMZM}A-
zy42B1TyspcNSLHnlHWCQ7KgOi=2-<$5)d7eH9`;vW$26fhGv(*-+w-H;F8HFDd(<e
zko`{VbFU3XEsB8MUs0id`|1heqs{GA-`mKmyUNB4|J{@S`6Rb%a&P(ztE;$fQ?f|x
zvULj^&*Cz0?x<)9ZOc_PC~zwnrkxm>I-ZM6>Au2Z*FpDUm#W<1-UX}l`B?>wNom@%
zWra`gbi3#OY+AuF>ywW)Pw7Pko-t+KXS%dw#fQ62d^{G{O~x=cj=Ax^g0dp!%9uL?
zF|T4oyNW+0(ykKRMkyS98E{Zs>Y?$&&hZ~a_YM?#2joA2Dm0KeK5fY<*6<#i&-UGv
z;s5!$%`<Eef9STyix;<{Ew+ljhk56AN;S6RO@wQ7VL!7kC<ul8e{exzMI~FpC9jKf
zF|75xiX%JfOwf8Kt|a;eaPAG-LoT6-oiYMzkB=<l#B0xtETiyiFO4i?bJ`mt%V?VI
zy#h-<<kA{lTG*wvy0i^0?K+qCMVGeUrQPb%?sRGIxU}E9w9mP;@3^!_T-uW^?KzkB
zE0;E(-1{rmfc7H7rDqfj?iR7q@x29uXwNOC7avGBD^|rvxM608OCglH&#n7By3eco
z#^}Bx-B+ypN_5{?-B+sn#_2v?_l?(m6Leph?whFl&d`06bl+s%SFZb}=)S4CZ<_9_
z(0ym>zUjK}EZtYB`)26AnYwS5?whUq=IFk;y3eQk=IOrqy6<e=caH8`p!*i;zAD|f
zNcUCizH@codAcvp>|;+IGw^g5ilCwu$KnZ^N5Ry0p&m@4iH)WD@4hbd159-O(Ms@-
ztN(QWA~ti;{$-rpZt>r^K!gTqd2*(>@!!_A5pn+E|H5Tm``0esLG{(v*6|ttpu2RP
giF)Bw6&mx@f6%>h^wnV8@G9HaYzK1w?tjqz|3Pq%!vFvP

literal 0
HcmV?d00001

diff --git a/test/parallel/test-compile-cache-success.js b/test/parallel/test-compile-cache-success.js
index c02a6243286972..9417b6bf63c490 100644
--- a/test/parallel/test-compile-cache-success.js
+++ b/test/parallel/test-compile-cache-success.js
@@ -64,3 +64,77 @@ const path = require('path');
       }
     });
 }
+
+// Roundtrip coverage for the dictionary-compressed path (added on top of
+// #63861), using many small modules because that is where the embedded
+// dictionary helps most. A first run persists the caches and a second run
+// must accept every one of them, which shows that each dict-compressed frame
+// decompresses to exactly the bytes that were persisted.
+{
+  tmpdir.refresh();
+  const dir = tmpdir.resolve('.compile_cache_dir');
+
+  // A handful of small generated modules is enough to hit the dictionary path.
+  const count = 8;
+  const modules = Array.from({ length: count }, (_, i) => {
+    const file = tmpdir.resolve(`mod-${i}.js`);
+    fs.writeFileSync(
+      file,
+      `'use strict';\n` +
+      `module.exports = function value${i}(a, b) {\n` +
+      `  const sum = a + b + ${i};\n` +
+      `  return { id: ${i}, sum, label: 'module-${i}' };\n` +
+      `};\n`);
+    return file;
+  });
+  const reqCode = modules.map((m) => `require(${JSON.stringify(m)});`).join('');
+
+  // Both runs share the same command line and environment and differ only in
+  // the debug output they expect. Every spawn gets a fresh options object.
+  const spawnOptions = () => ({
+    env: {
+      ...process.env,
+      NODE_DEBUG_NATIVE: 'COMPILE_CACHE',
+      NODE_COMPILE_CACHE: dir
+    },
+    cwd: tmpdir.path
+  });
+
+  // Returns a stderr checker that requires one match per module. `toPattern`
+  // turns the regexp-escaped module basename into the pattern source.
+  const expectForEachModule = (toPattern) => (output) => {
+    for (const m of modules) {
+      const name = path.basename(m).replace(/[.]/g, '\\.');
+      assert.match(output, new RegExp(toPattern(name)));
+    }
+    return true;
+  };
+
+  // First run: the cache must be written successfully for every module.
+  spawnSyncAndAssert(
+    process.execPath,
+    ['-e', reqCode],
+    spawnOptions(),
+    {
+      stderr: expectForEachModule(
+        (name) => `writing cache for .*${name}.*success`)
+    });
+
+  const cacheDirs = fs.readdirSync(dir);
+  assert.strictEqual(cacheDirs.length, 1);
+  // At least one entry per module (the `-e` runner is cached too).
+  const entries = fs.readdirSync(path.join(dir, cacheDirs[0]));
+  assert(entries.length >= count, `expected >= ${count} entries, got ${entries.length}`);
+
+  // Second run: every entry is read back from disk. "was accepted" is only
+  // logged for a cache that was usable after decompression, so this is a full
+  // roundtrip check of the dictionary-compressed entries.
+  spawnSyncAndAssert(
+    process.execPath,
+    ['-e', reqCode],
+    spawnOptions(),
+    {
+      stderr: expectForEachModule(
+        (name) => `cache for .*${name} was accepted, keeping the in-memory entry`)
+    });
+}
diff --git a/tools/generate_compile_cache_dict.py b/tools/generate_compile_cache_dict.py
new file mode 100644
index 00000000000000..8794889775bb63
--- /dev/null
+++ b/tools/generate_compile_cache_dict.py
@@ -0,0 +1,50 @@
+#!/usr/bin/env python3
+"""Generate compile_cache_zstd_dict.h from a trained zstd .dict file.
+
+Invoked by the GYP action in node.gyp at build time. Only the small binary
+.dict (src/compile_cache_zstd.dict) is checked into the repository; the C
+array it produces is generated into SHARED_INTERMEDIATE_DIR.
+"""
+import os
+import sys
+
+
+def main(dict_path, out_path):
+    """Write the bytes of `dict_path` to `out_path` as a C/C++ header.
+
+    The header defines kCompileCacheZstdDict (the raw dictionary bytes) and
+    kCompileCacheZstdDictSize (the number of bytes). Exits with an error
+    message if the dictionary is empty, because an empty array initializer
+    is not valid standard C++.
+    """
+    with open(dict_path, 'rb') as f:
+        data = f.read()
+    if not data:
+        sys.exit('%s is empty; refusing to generate %s' %
+                 (dict_path, out_path))
+
+    lines = [
+        '// Generated by tools/generate_compile_cache_dict.py',
+        '// from %s' % os.path.basename(dict_path),
+        '// The .dict file is the source of truth; do not edit by hand.',
+        '',
+        '#include <stddef.h>  // size_t',
+        '',
+        'static const unsigned char kCompileCacheZstdDict[] = {',
+    ]
+    for i in range(0, len(data), 12):
+        chunk = data[i:i + 12]
+        # Iterating over bytes yields ints (Python 3), as '%02x' requires.
+        lines.append('  %s,' % ', '.join('0x%02x' % b for b in chunk))
+    lines.append('};')
+    lines.append('static const size_t kCompileCacheZstdDictSize = %d;' %
+                 len(data))
+
+    with open(out_path, 'w') as f:
+        f.write('\n'.join(lines) + '\n')
+
+
+if __name__ == '__main__':
+    if len(sys.argv) != 3:
+        sys.exit('Usage: %s <input.dict> <output.h>' % sys.argv[0])
+    main(sys.argv[1], sys.argv[2])