新技能：通过代码缓存加速 Node.js 的启动

89次阅读

共计 4750 个字符，预计需要花费 12 分钟才能阅读完成。

导读	本文介绍在 Node.js 里如何利用代码缓存技术加速 Node.js 的启动。

新技能：通过代码缓存加速 Node.js 的启动
前言：之前的文章介绍了通过快照的方式加速 Node.js 的启动，除了快照，V8 还提供了另一种技术加速代码的执行，那就是代码缓存。通过 V8 第一次执行 JS 的时候，V8 需要即时进行解析和编译 JS 代码，这个是需要一定时间的，代码缓存可以把这个过程的一些信息保存下来，下次执行的时候，通过这个缓存的信息就可以加速 JS 代码的执行。本文介绍在 Node.js 里如何利用代码缓存技术加速 Node.js 的启动。

首先看一下 Node.js 的编译配置。

 'actions': [
  {
    'action_name': 'node_js2c',
    'process_outputs_as_sources': 1,
    'inputs': [
      'tools/js2c.py',
      '
 通过这个配置，在编译 Node.js 的时候，会执行 js2c.py，并且把输入写到 node_javascript.cc 文件。我们看一下生成的内容。
 
里面定义了一个函数，这个函数里面往 source_ 字段里不断追加一系列的内容，其中 key 是 Node.js 中的原生 JS 模块信息，值是模块的内容，我们随便看一个模块 assert/strict。
const data = [39,117,115,101, 32,115,116,114,105, 99,116, 39, 59, 10, 10,109,111,100,117,108,101, 46,101,120,112,111,114,116,115, 32,61, 32,114,101,113,117,105,114,101, 40, 39, 97,115,115,101,114,116, 39, 41, 46,115,116,114,105, 99,116, 59, 10];
console.log(Buffer.from(data).toString('utf-8'))
 输出如下。
'use strict';
module.exports = require('assert').strict;
 通过 js2c.py 脚本，Node.js 把原生 JS 模块的内容写到了文件中，并且编译进 Node.js 的可执行文件里，这样在 Node.js 启动时就不需要从硬盘里读取对应的文件，否则无论是启动还是运行时动态加载原生 JS 模块，都需要更多的耗时，因为内存的速度远快于硬盘。这是 Node.js 做的第一个优化，接下来看代码缓存，因为代码缓存是在这个基础上实现的。首先看一下编译配置。
['node_use_node_code_cache=="true"', {'dependencies': ['mkcodecache',],
  'actions': [
    {
      'action_name': 'run_mkcodecache',
      'process_outputs_as_sources': 1,
      'inputs': [
        '
 如果编译 Node.js 时 node_use_node_code_cache 为 true 则生成代码缓存。如果我们不需要可以关掉，具体执行 ./configure --without-node-code-cache。如果我们关闭代码缓存，Node.js 关于这部分的实现是空，具体在 node_code_cache_stub.cc。
const bool has_code_cache = false;
void NativeModuleEnv::InitializeCodeCache() {}
 也就是什么都不做。如果我们开启了代码缓存，就会执行 mkcodecache.cc 生成代码缓存。
int main(int argc, char* argv[]) {argv = uv_setup_args(argc, argv);
  std::ofstream out;
  out.open(argv[1], std::ios::out | std::ios::binary);
  node::per_process::enabled_debug_list.Parse(nullptr);
  std::unique_ptr<:platform> platform = v8::platform::NewDefaultPlatform();
  v8::V8::InitializePlatform(platform.get());
  v8::V8::Initialize();
  Isolate::CreateParams create_params;
  create_params.array_buffer_allocator_shared.reset(ArrayBuffer::Allocator::NewDefaultAllocator());
  Isolate* isolate = Isolate::New(create_params);
  {Isolate::Scope isolate_scope(isolate);
    v8::HandleScope handle_scope(isolate);
    v8::Local<:context> context = v8::Context::New(isolate);
    v8::Context::Scope context_scope(context);
    std::string cache = CodeCacheBuilder::Generate(context);
    out Dispose();
  v8::V8::ShutdownPlatform();
  return 0;
}
 
 首先打开文件，然后是 V8 的常用初始化逻辑，最后通过 Generate 生成代码缓存。
std::string CodeCacheBuilder::Generate(Local context) {NativeModuleLoader* loader = NativeModuleLoader::GetInstance();
  std::vector<:string> ids = loader->GetModuleIds();
  std::map<:string scriptcompiler::cacheddata> data;
  for (const auto& id : ids) {if (loader->CanBeRequired(id.c_str())) {
      NativeModuleLoader::Result result;
      USE(loader->CompileAsModule(context, id.c_str(), &result));
      ScriptCompiler::CachedData* cached_data = loader->GetCodeCache(id.c_str());
      data.emplace(id, cached_data);
    }
  }
  return GenerateCodeCache(data);
}
 
 首先新建一个 NativeModuleLoader。
NativeModuleLoader::NativeModuleLoader() : config_(GetConfig()) {LoadJavaScriptSource();
}
NativeModuleLoader 初始化时会执行 LoadJavaScriptSource，这个函数就是通过 python 脚本生成的 node_javascript.cc 文件里的函数，初始化完成后 NativeModuleLoader 对象的 source_ 字段就保存了原生 JS 模块的代码。接着遍历这些原生 JS 模块，通过 CompileAsModule 进行编译。
MaybeLocal NativeModuleLoader::CompileAsModule(Local context,
    const char* id,
    NativeModuleLoader::Result* result) {Isolate* isolate = context->GetIsolate();
  std::vector> parameters = {FIXED_ONE_BYTE_STRING(isolate, "exports"),
      FIXED_ONE_BYTE_STRING(isolate, "require"),
      FIXED_ONE_BYTE_STRING(isolate, "module"),
      FIXED_ONE_BYTE_STRING(isolate, "process"),
      FIXED_ONE_BYTE_STRING(isolate, "internalBinding"),
      FIXED_ONE_BYTE_STRING(isolate, "primordials")};
  return LookupAndCompile(context, id, &parameters, result);
}
 
 接着看 LookupAndCompile
MaybeLocal NativeModuleLoader::LookupAndCompile(Local context,
    const char* id,
    std::vector>* parameters,
    NativeModuleLoader::Result* result) {Isolate* isolate = context->GetIsolate();
  EscapableHandleScope scope(isolate);
  Local source;
  // 根据 key 从 source_ 字段找到模块内容
  if (!LoadBuiltinModuleSource(isolate, id).ToLocal(&source)) {return {};
  }
  std::string filename_s = std::string("node:") + id;
  Local filename =
      OneByteString(isolate, filename_s.c_str(), filename_s.size());
  ScriptOrigin origin(isolate, filename, 0, 0, true);
  ScriptCompiler::CachedData* cached_data = nullptr;
  {Mutex::ScopedLock lock(code_cache_mutex_);
    // 判断是否有代码缓存
    auto cache_it = code_cache_.find(id);
    if (cache_it != code_cache_.end()) {cached_data = cache_it->second.release();
      code_cache_.erase(cache_it);
    }
  }
  const bool has_cache = cached_data != nullptr;
  ScriptCompiler::CompileOptions options =
      has_cache ? ScriptCompiler::kConsumeCodeCache
                : ScriptCompiler::kEagerCompile;
  // 如果有代码缓存则传入             
  ScriptCompiler::Source script_source(source, origin, cached_data);
  // 进行编译
  MaybeLocal maybe_fun =
      ScriptCompiler::CompileFunctionInContext(context,
                                               &script_source,
                                               parameters->size(),
                                               parameters->data(),
                                               0,
                                               nullptr,
                                               options);
  Local fun;
  if (!maybe_fun.ToLocal(&fun)) {return MaybeLocal();}
  *result = (has_cache && !script_source.GetCachedData()->rejected)
                ? Result::kWithCache
                : Result::kWithoutCache;
  // 生成代码缓存保存下来，最后写入文件，下次使用
  std::unique_ptr

正文完

星哥玩云-微信公众号

发表至： linux教程

2024-07-25

0

转载说明：除特殊说明外本站文章皆由CC-4.0协议发布，转载请注明出处。

dnsmasq配置dns实战

Go 代码中如何绑定 Host

相比 Windows 为什么越来越多人选择Linux？

如何从 Docker Desktop 切换到 Colima

Ubuntu16.04最快捷搭建小型局域网Git服务器

Linux下磁盘分区工具cfdisk的使用

linux 命令行中的计算器

MySQL的半同步复制

带你进入Vue2响应式系统之嵌套之旅

新技能：通过代码缓存加速 Node.js 的启动

申请腾讯混元的API Key并且使用LobeChat调用混元AI

Docker部署搭建一个开源强大的图书管理系统

基于Docker快速搭建一个开源的IT人员在线工具箱-it-tools

让每个人都可以轻松使用Git-腾讯自研Git客户端

使用Docker部署开源的WPS-Office

详解:Linux 硬盘，格式化，分区详解

Python 中 set 是什么？为何要是用它？

简单3步部署本地国产大模型DeepSeek大模型

干货：基于nginx的tcp反向代理案例

2025年第一起运维事故-江教在线网传删库跑路？

	'actions': [
	{
	'action_name': 'node_js2c',
	'process_outputs_as_sources': 1,
	'inputs': [
	'tools/js2c.py',
	'
	通过这个配置，在编译 Node.js 的时候，会执行 js2c.py，并且把输入写到 node_javascript.cc 文件。我们看一下生成的内容。

	里面定义了一个函数，这个函数里面往 source_ 字段里不断追加一系列的内容，其中 key 是 Node.js 中的原生 JS 模块信息，值是模块的内容，我们随便看一个模块 assert/strict。
	const data = [39,117,115,101, 32,115,116,114,105, 99,116, 39, 59, 10, 10,109,111,100,117,108,101, 46,101,120,112,111,114,116,115, 32,61, 32,114,101,113,117,105,114,101, 40, 39, 97,115,115,101,114,116, 39, 41, 46,115,116,114,105, 99,116, 59, 10];
	console.log(Buffer.from(data).toString('utf-8'))
	输出如下。
	'use strict';
	module.exports = require('assert').strict;
	通过 js2c.py 脚本，Node.js 把原生 JS 模块的内容写到了文件中，并且编译进 Node.js 的可执行文件里，这样在 Node.js 启动时就不需要从硬盘里读取对应的文件，否则无论是启动还是运行时动态加载原生 JS 模块，都需要更多的耗时，因为内存的速度远快于硬盘。这是 Node.js 做的第一个优化，接下来看代码缓存，因为代码缓存是在这个基础上实现的。首先看一下编译配置。
	['node_use_node_code_cache=="true"', {'dependencies': ['mkcodecache',],
	'actions': [
	{
	'action_name': 'run_mkcodecache',
	'process_outputs_as_sources': 1,
	'inputs': [
	'
	如果编译 Node.js 时 node_use_node_code_cache 为 true 则生成代码缓存。如果我们不需要可以关掉，具体执行 ./configure --without-node-code-cache。如果我们关闭代码缓存，Node.js 关于这部分的实现是空，具体在 node_code_cache_stub.cc。
	const bool has_code_cache = false;
	void NativeModuleEnv::InitializeCodeCache() {}
	也就是什么都不做。如果我们开启了代码缓存，就会执行 mkcodecache.cc 生成代码缓存。
	int main(int argc, char* argv[]) {argv = uv_setup_args(argc, argv);
	std::ofstream out;
	out.open(argv[1], std::ios::out \| std::ios::binary);
	node::per_process::enabled_debug_list.Parse(nullptr);
	std::unique_ptr<:platform> platform = v8::platform::NewDefaultPlatform();
	v8::V8::InitializePlatform(platform.get());
	v8::V8::Initialize();
	Isolate::CreateParams create_params;
	create_params.array_buffer_allocator_shared.reset(ArrayBuffer::Allocator::NewDefaultAllocator());
	Isolate* isolate = Isolate::New(create_params);
	{Isolate::Scope isolate_scope(isolate);
	v8::HandleScope handle_scope(isolate);
	v8::Local<:context> context = v8::Context::New(isolate);
	v8::Context::Scope context_scope(context);
	std::string cache = CodeCacheBuilder::Generate(context);
	out Dispose();
	v8::V8::ShutdownPlatform();
	return 0;
	}

	首先打开文件，然后是 V8 的常用初始化逻辑，最后通过 Generate 生成代码缓存。
	std::string CodeCacheBuilder::Generate(Local context) {NativeModuleLoader* loader = NativeModuleLoader::GetInstance();
	std::vector<:string> ids = loader->GetModuleIds();
	std::map<:string scriptcompiler::cacheddata> data;
	for (const auto& id : ids) {if (loader->CanBeRequired(id.c_str())) {
	NativeModuleLoader::Result result;
	USE(loader->CompileAsModule(context, id.c_str(), &result));
	ScriptCompiler::CachedData* cached_data = loader->GetCodeCache(id.c_str());
	data.emplace(id, cached_data);
	}
	}
	return GenerateCodeCache(data);
	}

	首先新建一个 NativeModuleLoader。
	NativeModuleLoader::NativeModuleLoader() : config_(GetConfig()) {LoadJavaScriptSource();
	}
	NativeModuleLoader 初始化时会执行 LoadJavaScriptSource，这个函数就是通过 python 脚本生成的 node_javascript.cc 文件里的函数，初始化完成后 NativeModuleLoader 对象的 source_ 字段就保存了原生 JS 模块的代码。接着遍历这些原生 JS 模块，通过 CompileAsModule 进行编译。
	MaybeLocal NativeModuleLoader::CompileAsModule(Local context,
	const char* id,
	NativeModuleLoader::Result* result) {Isolate* isolate = context->GetIsolate();
	std::vector> parameters = {FIXED_ONE_BYTE_STRING(isolate, "exports"),
	FIXED_ONE_BYTE_STRING(isolate, "require"),
	FIXED_ONE_BYTE_STRING(isolate, "module"),
	FIXED_ONE_BYTE_STRING(isolate, "process"),
	FIXED_ONE_BYTE_STRING(isolate, "internalBinding"),
	FIXED_ONE_BYTE_STRING(isolate, "primordials")};
	return LookupAndCompile(context, id, &parameters, result);
	}

	接着看 LookupAndCompile
	MaybeLocal NativeModuleLoader::LookupAndCompile(Local context,
	const char* id,
	std::vector>* parameters,
	NativeModuleLoader::Result* result) {Isolate* isolate = context->GetIsolate();
	EscapableHandleScope scope(isolate);
	Local source;
	// 根据 key 从 source_ 字段找到模块内容
	if (!LoadBuiltinModuleSource(isolate, id).ToLocal(&source)) {return {};
	}
	std::string filename_s = std::string("node:") + id;
	Local filename =
	OneByteString(isolate, filename_s.c_str(), filename_s.size());
	ScriptOrigin origin(isolate, filename, 0, 0, true);
	ScriptCompiler::CachedData* cached_data = nullptr;
	{Mutex::ScopedLock lock(code_cache_mutex_);
	// 判断是否有代码缓存
	auto cache_it = code_cache_.find(id);
	if (cache_it != code_cache_.end()) {cached_data = cache_it->second.release();
	code_cache_.erase(cache_it);
	}
	}
	const bool has_cache = cached_data != nullptr;
	ScriptCompiler::CompileOptions options =
	has_cache ? ScriptCompiler::kConsumeCodeCache
	: ScriptCompiler::kEagerCompile;
	// 如果有代码缓存则传入
	ScriptCompiler::Source script_source(source, origin, cached_data);
	// 进行编译
	MaybeLocal maybe_fun =
	ScriptCompiler::CompileFunctionInContext(context,
	&script_source,
	parameters->size(),
	parameters->data(),
	0,
	nullptr,
	options);
	Local fun;
	if (!maybe_fun.ToLocal(&fun)) {return MaybeLocal();}
	*result = (has_cache && !script_source.GetCachedData()->rejected)
	? Result::kWithCache
	: Result::kWithoutCache;
	// 生成代码缓存保存下来，最后写入文件，下次使用
	std::unique_ptr