Skip to content

Commit d0b6ea1

Browse files
GeoffreyBooth and joyeecheung
authored and committed
module: eliminate performance cost of detection for cjs entry
PR-URL: nodejs#52093 Reviewed-By: Matteo Collina <[email protected]> Reviewed-By: Yagiz Nizipli <[email protected]> Reviewed-By: Joyee Cheung <[email protected]> Reviewed-By: Jacob Smith <[email protected]> Reviewed-By: Richard Lau <[email protected]>
1 parent c832e66 commit d0b6ea1

File tree

6 files changed

+192
-97
lines changed

6 files changed

+192
-97
lines changed

benchmark/misc/startup-core.js

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@ const bench = common.createBenchmark(main, {
99
script: [
1010
'benchmark/fixtures/require-builtins',
1111
'test/fixtures/semicolon',
12+
'test/fixtures/snapshot/typescript',
1213
],
1314
mode: ['process', 'worker'],
1415
n: [30],

lib/internal/modules/cjs/loader.js

Lines changed: 10 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -106,6 +106,7 @@ module.exports = {
106106
kModuleExportNames,
107107
kModuleCircularVisited,
108108
initializeCJS,
109+
entryPointSource: undefined, // Set below.
109110
Module,
110111
wrapSafe,
111112
kIsMainSymbol,
@@ -1391,8 +1392,15 @@ function wrapSafe(filename, content, cjsModuleInstance, codeCache) {
13911392
return result;
13921393
} catch (err) {
13931394
if (process.mainModule === cjsModuleInstance) {
1394-
const { enrichCJSError } = require('internal/modules/esm/translators');
1395-
enrichCJSError(err, content, filename);
1395+
if (getOptionValue('--experimental-detect-module')) {
1396+
// For the main entry point, cache the source to potentially retry as ESM.
1397+
module.exports.entryPointSource = content;
1398+
} else {
1399+
// We only enrich the error (print a warning) if we're sure we're going to throw it; so if we're
1400+
// retrying as ESM, wait until we know whether we're going to retry before calling `enrichCJSError`.
1401+
const { enrichCJSError } = require('internal/modules/esm/translators');
1402+
enrichCJSError(err, content, filename);
1403+
}
13961404
}
13971405
throw err;
13981406
}

lib/internal/modules/helpers.js

Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,15 @@ const {
1919
} = require('internal/errors').codes;
2020
const { BuiltinModule } = require('internal/bootstrap/realm');
2121

22+
const {
23+
shouldRetryAsESM: contextifyShouldRetryAsESM,
24+
constants: {
25+
syntaxDetectionErrors: {
26+
esmSyntaxErrorMessages,
27+
throwsOnlyInCommonJSErrorMessages,
28+
},
29+
},
30+
} = internalBinding('contextify');
2231
const { validateString } = require('internal/validators');
2332
const fs = require('fs'); // Import all of `fs` so that it can be monkey-patched.
2433
const internalFS = require('internal/fs/utils');
@@ -329,6 +338,31 @@ function urlToFilename(url) {
329338
return url;
330339
}
331340

341+
let esmSyntaxErrorMessagesSet; // Initialized lazily in shouldRetryAsESM
342+
let throwsOnlyInCommonJSErrorMessagesSet; // Initialized lazily in shouldRetryAsESM
343+
/**
344+
* After an attempt to parse a module as CommonJS throws an error, should we try again as ESM?
345+
* We only want to try again as ESM if the error is due to syntax that is only valid in ESM; and if the CommonJS parse
346+
* throws on an error that would not have been a syntax error in ESM (like via top-level `await` or a lexical
347+
* redeclaration of one of the CommonJS variables) then we need to parse again to see if it would have thrown in ESM.
348+
* @param {string} errorMessage The string message thrown by V8 when attempting to parse as CommonJS
349+
* @param {string} source Module contents
* @returns {boolean} `true` if `errorMessage` is one of `esmSyntaxErrorMessages`; the result of the contextify
* `shouldRetryAsESM(source)` check if it is one of `throwsOnlyInCommonJSErrorMessages`; `false` otherwise.
350+
*/
351+
function shouldRetryAsESM(errorMessage, source) {
// Build the lookup set only on the first call; `??=` leaves an already-created set untouched.
352+
esmSyntaxErrorMessagesSet ??= new SafeSet(esmSyntaxErrorMessages);
353+
if (esmSyntaxErrorMessagesSet.has(errorMessage)) {
354+
return true;
355+
}
356+

// Same lazy initialization for the second list; it is only reached when the first check did not match.
357+
throwsOnlyInCommonJSErrorMessagesSet ??= new SafeSet(throwsOnlyInCommonJSErrorMessages);
358+
if (throwsOnlyInCommonJSErrorMessagesSet.has(errorMessage)) {
// The message alone is not conclusive here, so the decision is delegated to the binding, which receives the source.
359+
return /** @type {boolean} */(contextifyShouldRetryAsESM(source));
360+
}
361+

// Any other error message: do not retry as ESM.
362+
return false;
363+
}
364+
365+
332366
// Whether we have started executing any user-provided CJS code.
333367
// This is set right before we call the wrapped CJS code (not after,
334368
// in case we are half-way in the execution when internals check this).
@@ -362,6 +396,7 @@ module.exports = {
362396
loadBuiltinModule,
363397
makeRequireFunction,
364398
normalizeReferrerURL,
399+
shouldRetryAsESM,
365400
stripBOM,
366401
toRealPath,
367402
hasStartedUserCJSExecution() {

lib/internal/modules/run_main.js

Lines changed: 32 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,6 @@ const {
44
StringPrototypeEndsWith,
55
} = primordials;
66

7-
const { containsModuleSyntax } = internalBinding('contextify');
87
const { getNearestParentPackageJSONType } = internalBinding('modules');
98
const { getOptionValue } = require('internal/options');
109
const { checkPackageJSONIntegrity } = require('internal/modules/package_json_reader');
@@ -82,10 +81,6 @@ function shouldUseESMLoader(mainPath) {
8281

8382
// No package.json or no `type` field.
8483
if (response === undefined || response[0] === 'none') {
85-
if (getOptionValue('--experimental-detect-module')) {
86-
// If the first argument of `containsModuleSyntax` is undefined, it will read `mainPath` from the file system.
87-
return containsModuleSyntax(undefined, mainPath);
88-
}
8984
return false;
9085
}
9186

@@ -160,12 +155,43 @@ function runEntryPointWithESMLoader(callback) {
160155
* by `require('module')`) even when the entry point is ESM.
161156
* This monkey-patchable code is bypassed under `--experimental-default-type=module`.
162157
* Because of backwards compatibility, this function is exposed publicly via `import { runMain } from 'node:module'`.
158+
* When `--experimental-detect-module` is passed, this function will attempt to run ambiguous (no explicit extension, no
159+
* `package.json` type field) entry points as CommonJS first; under certain conditions, it will retry running as ESM.
163160
* @param {string} main - First positional CLI argument, such as `'entry.js'` from `node entry.js`
164161
*/
165162
function executeUserEntryPoint(main = process.argv[1]) {
166163
const resolvedMain = resolveMainPath(main);
167164
const useESMLoader = shouldUseESMLoader(resolvedMain);
168-
if (useESMLoader) {
165+
166+
// Unless we know we should use the ESM loader to handle the entry point per the checks in `shouldUseESMLoader`, first
167+
// try to run the entry point via the CommonJS loader; and if that fails under certain conditions, retry as ESM.
168+
let retryAsESM = false;
169+
if (!useESMLoader) {
170+
const cjsLoader = require('internal/modules/cjs/loader');
171+
const { Module } = cjsLoader;
172+
if (getOptionValue('--experimental-detect-module')) {
173+
try {
174+
// Module._load is the monkey-patchable CJS module loader.
175+
Module._load(main, null, true);
176+
} catch (error) {
177+
const source = cjsLoader.entryPointSource;
178+
const { shouldRetryAsESM } = require('internal/modules/helpers');
179+
retryAsESM = shouldRetryAsESM(error.message, source);
180+
// In case the entry point is a large file, such as a bundle,
181+
// ensure no further references can prevent it being garbage-collected.
182+
cjsLoader.entryPointSource = undefined;
183+
if (!retryAsESM) {
184+
const { enrichCJSError } = require('internal/modules/esm/translators');
185+
enrichCJSError(error, source, resolvedMain);
186+
throw error;
187+
}
188+
}
189+
} else { // `--experimental-detect-module` is not passed
190+
Module._load(main, null, true);
191+
}
192+
}
193+
194+
if (useESMLoader || retryAsESM) {
169195
const mainPath = resolvedMain || main;
170196
const mainURL = pathToFileURL(mainPath).href;
171197

@@ -174,10 +200,6 @@ function executeUserEntryPoint(main = process.argv[1]) {
174200
// even after the event loop stops running.
175201
return cascadedLoader.import(mainURL, undefined, { __proto__: null }, true);
176202
});
177-
} else {
178-
// Module._load is the monkey-patchable CJS module loader.
179-
const { Module } = require('internal/modules/cjs/loader');
180-
Module._load(main, null, true);
181203
}
182204
}
183205

0 commit comments

Comments
 (0)