From fbc775495fcdfc6e4bd87050c1389df02538ece7 Mon Sep 17 00:00:00 2001 From: Paul Gschwendtner Date: Thu, 14 Jul 2022 18:47:01 +0000 Subject: [PATCH] fixup! Consistently perform bootstrap and encode Brotli config for improved caching/reduced complexity Re-add fast-path for ESM when we detect it before phase3. And simplify code. --- src/bin.ts | 126 ++++++++++++++++-------------- src/child/child-entrypoint.ts | 12 ++- src/child/child-exec-args.ts | 7 +- src/child/spawn-child-with-esm.ts | 6 +- 4 files changed, 84 insertions(+), 67 deletions(-) diff --git a/src/bin.ts b/src/bin.ts index bae950d48..2379fb341 100644 --- a/src/bin.ts +++ b/src/bin.ts @@ -32,6 +32,9 @@ import { callInChildWithEsm } from './child/spawn-child-with-esm'; import { findAndReadConfig } from './configuration'; import { getChildProcessArguments } from './child/child-exec-args'; +type MarkPropAsRequired = Omit & + Required>; + /** * Main `bin` functionality. * @@ -73,66 +76,74 @@ export interface BootstrapState { * only capture information that should be persisted to e.g. forked child processes. */ export interface BootstrapStateForForkedProcesses { - // For the final bootstrap we are only interested in the user arguments - // that should be passed to the entry-point script (or eval script). - // We don't want to encode any options that would break child forking. e.g. - // persisting the `--eval` option would break `child_process.fork` in scripts. - parseArgvResult: Pick, 'restArgs'>; + // For the final bootstrap we are only interested in the user arguments that should + // be passed to the entry-point script (or eval script). We don't want to encode any + // other options from `parseArgvResult` that would break child forking. + // e.g. persisting the `--eval` option would break `child_process.fork` in scripts. + restArgs: string[]; phase3Result: Pick< ReturnType, 'enableEsmLoader' | 'preloadedConfig' >; } -export interface BootstrapStateInitialProcessChild - extends Omit { - initialProcessOptions: { resolutionCwd: string } & Pick< - ReturnType, - // These are options which should not persist into forked child processes, - // but can be passed-through in the initial child process creation -- but should - // not be encoded in the Brotli state for child process forks (through `execArgv`.) - 'version' | 'showConfig' | 'code' | 'print' | 'interactive' - >; +export interface BootstrapStateInitialProcess + extends Omit { + initialChildArgv: ReturnType; + initialChildResolutionCwd: string; + phase3Result?: ReturnType; } -export type BootstrapStateForChild = Omit< - BootstrapStateForForkedProcesses, - 'initialProcessOptions' -> & - Partial; +export type BootstrapStateForChild = BootstrapStateForForkedProcesses & + Partial; /** @internal */ export function bootstrap(state: BootstrapState) { state.phase2Result = phase2(state); - state.phase3Result = phase3(state); - - const initialChildState: BootstrapStateInitialProcessChild = { - ...createBootstrapStateForChildProcess(state as Required), - // Aside with the default child process state, we attach the initial process - // options since this `callInChild` invocation is from the initial process. - // Later when forking, the initial process options are omitted / not persisted. - initialProcessOptions: { - code: state.parseArgvResult.code, - interactive: state.parseArgvResult.interactive, - print: state.parseArgvResult.print, - showConfig: state.parseArgvResult.showConfig, - version: state.parseArgvResult.version, - resolutionCwd: state.phase2Result.resolutionCwd, - }, + + const initialProcessState: BootstrapStateInitialProcess = { + restArgs: state.parseArgvResult.restArgs, + initialChildArgv: state.parseArgvResult, + initialChildResolutionCwd: state.phase2Result.resolutionCwd, }; + // Perf optimization for ESM until ESM hooks can be registered without needing + // a child process. We skip phase3 and defer it to the child process where we + // would load the TS compiler anyway, avoiding loading it twice in different processes. + if (initialProcessState.initialChildArgv.esm) { + callInChildWithEsm(initialProcessState, process.cwd()); + return; + } + + const phase3Result = phase3(initialProcessState); + // For ESM, we need to spawn a new Node process to be able to register our hooks. - if (state.phase3Result.enableEsmLoader) { + if (phase3Result.enableEsmLoader) { // Note: When transitioning into the child process for the final phase, // we want to preserve the initial user working directory. - callInChildWithEsm(initialChildState, process.cwd()); + callInChildWithEsm(initialProcessState, process.cwd()); } else { - completeBootstrap(initialChildState); + completeBootstrap({ ...initialProcessState, phase3Result }); } } /** Final phase of the bootstrap. */ -export function completeBootstrap(state: BootstrapStateForChild) { - return phase4(state); +export function completeBootstrap( + state: BootstrapStateForForkedProcesses | BootstrapStateInitialProcess +) { + // IMPORTANT: This is an optimization when we detected `--esm` early in the CLI. + // In such cases we skip phase3 and let phase3 to be processed in the child process here. + // This avoids loading the TS compiler twice as loading TS is rather slow. + // TODO: Remove this when we don't need to spawn a child process for ESM. See: + if (state.phase3Result === undefined) { + state.phase3Result = phase3(state as BootstrapStateInitialProcess); + } + + return phase4( + state as MarkPropAsRequired< + BootstrapStateForForkedProcesses | BootstrapStateInitialProcess, + 'phase3Result' + > + ); } function parseArgv(argv: string[], entrypointArgs: Record) { @@ -394,8 +405,8 @@ function phase3(payload: BootstrapState) { scopeDir, esm, experimentalSpecifierResolution, - } = payload.parseArgvResult; - const { resolutionCwd } = payload.phase2Result!; + } = payload.initialChildArgv; + const resolutionCwd = payload.initialChildResolutionCwd; // NOTE: When we transition to a child process for ESM, the entry-point script determined // here might not be the one used later in `phase4`. This can happen when we execute the @@ -405,7 +416,7 @@ function phase3(payload: BootstrapState) { // See: https://github.com/TypeStrong/ts-node/issues/1812. const { entryPointPath } = getEntryPointInfo( resolutionCwd, - payload.parseArgvResult! + payload.initialChildArgv ); const preloadedConfig = findAndReadConfig({ @@ -498,10 +509,9 @@ function getEntryPointInfo( } function phase4(payload: BootstrapStateForChild) { - const { restArgs } = payload.parseArgvResult; + const restArgs = payload.restArgs; const { preloadedConfig } = payload.phase3Result; - const resolutionCwd = - payload.initialProcessOptions?.resolutionCwd ?? process.cwd(); + const resolutionCwd = payload.initialChildResolutionCwd ?? process.cwd(); const { entryPointPath, @@ -510,9 +520,9 @@ function phase4(payload: BootstrapStateForChild) { executeRepl, executeStdin, } = getEntryPointInfo(resolutionCwd, { - code: payload.initialProcessOptions?.code, - interactive: payload.initialProcessOptions?.interactive, - restArgs: payload.parseArgvResult.restArgs, + code: payload.initialChildArgv?.code, + interactive: payload.initialChildArgv?.interactive, + restArgs: payload.restArgs, }); /** @@ -597,13 +607,13 @@ function phase4(payload: BootstrapStateForChild) { stdinStuff?.repl.setService(service); // Output project information. - if (payload.initialProcessOptions?.version === 2) { + if (payload.initialChildArgv?.version === 2) { console.log(`ts-node v${VERSION}`); console.log(`node ${process.version}`); console.log(`compiler v${service.ts.version}`); process.exit(0); } - if ((payload.initialProcessOptions?.version ?? 0) >= 3) { + if ((payload.initialChildArgv?.version ?? 0) >= 3) { console.log(`ts-node v${VERSION} ${dirname(__dirname)}`); console.log(`node ${process.version}`); console.log( @@ -612,7 +622,7 @@ function phase4(payload: BootstrapStateForChild) { process.exit(0); } - if (payload.initialProcessOptions?.showConfig) { + if (payload.initialChildArgv?.showConfig) { const ts = service.ts as any as TSInternal; if (typeof ts.convertToTSConfig !== 'function') { console.error( @@ -700,8 +710,8 @@ function phase4(payload: BootstrapStateForChild) { evalAndExitOnTsError( evalStuff!.repl, evalStuff!.module!, - payload.initialProcessOptions!.code!, - payload.initialProcessOptions!.print, + payload.initialChildArgv!.code!, + payload.initialChildArgv!.print, 'eval' ); } @@ -711,7 +721,7 @@ function phase4(payload: BootstrapStateForChild) { } if (executeStdin) { - let buffer = payload.initialProcessOptions?.code ?? ''; + let buffer = payload.initialChildArgv?.code ?? ''; process.stdin.on('data', (chunk: Buffer) => (buffer += chunk)); process.stdin.on('end', () => { evalAndExitOnTsError( @@ -719,7 +729,7 @@ function phase4(payload: BootstrapStateForChild) { stdinStuff!.module!, buffer, // `echo 123 | node -p` still prints 123 - payload.initialProcessOptions?.print ?? false, + payload.initialChildArgv?.print ?? false, 'stdin' ); }); @@ -728,14 +738,12 @@ function phase4(payload: BootstrapStateForChild) { } function createBootstrapStateForChildProcess( - state: BootstrapStateInitialProcessChild | BootstrapStateForForkedProcesses + state: BootstrapStateInitialProcess | BootstrapStateForForkedProcesses ): BootstrapStateForForkedProcesses { // NOTE: Build up the child process fork bootstrap state manually so that we do // not encode unnecessary properties into the bootstrap state that is persisted return { - parseArgvResult: { - restArgs: state.parseArgvResult.restArgs, - }, + restArgs: state.restArgs, phase3Result: { enableEsmLoader: state.phase3Result!.enableEsmLoader, preloadedConfig: state.phase3Result!.preloadedConfig, diff --git a/src/child/child-entrypoint.ts b/src/child/child-entrypoint.ts index ce9e9ed1a..bce6bcff5 100644 --- a/src/child/child-entrypoint.ts +++ b/src/child/child-entrypoint.ts @@ -1,11 +1,17 @@ -import { completeBootstrap, BootstrapStateForChild } from '../bin'; +import { + completeBootstrap, + BootstrapStateInitialProcess, + BootstrapStateForForkedProcesses, +} from '../bin'; import { argPrefix, decompress } from './argv-payload'; const base64ConfigArg = process.argv[2]; if (!base64ConfigArg.startsWith(argPrefix)) throw new Error('unexpected argv'); const base64Payload = base64ConfigArg.slice(argPrefix.length); -const state = decompress(base64Payload) as BootstrapStateForChild; +const state = decompress(base64Payload) as + | BootstrapStateForForkedProcesses + | BootstrapStateInitialProcess; -state.parseArgvResult.restArgs = process.argv.slice(3); +state.restArgs = process.argv.slice(3); completeBootstrap(state); diff --git a/src/child/child-exec-args.ts b/src/child/child-exec-args.ts index 65164aafb..19a6b79fc 100644 --- a/src/child/child-exec-args.ts +++ b/src/child/child-exec-args.ts @@ -1,11 +1,14 @@ import { pathToFileURL } from 'url'; import { brotliCompressSync } from 'zlib'; -import type { BootstrapStateForChild } from '../bin'; +import type { + BootstrapStateForForkedProcesses, + BootstrapStateInitialProcess, +} from '../bin'; import { argPrefix } from './argv-payload'; export function getChildProcessArguments( enableEsmLoader: boolean, - state: BootstrapStateForChild + state: BootstrapStateForForkedProcesses | BootstrapStateInitialProcess ) { const nodeExecArgs = []; diff --git a/src/child/spawn-child-with-esm.ts b/src/child/spawn-child-with-esm.ts index ca8892923..5e765257c 100644 --- a/src/child/spawn-child-with-esm.ts +++ b/src/child/spawn-child-with-esm.ts @@ -1,5 +1,5 @@ import { fork } from 'child_process'; -import type { BootstrapStateForChild } from '../bin'; +import type { BootstrapStateInitialProcess } from '../bin'; import { getChildProcessArguments } from './child-exec-args'; /** @@ -11,13 +11,13 @@ import { getChildProcessArguments } from './child-exec-args'; * the child process. */ export function callInChildWithEsm( - state: BootstrapStateForChild, + state: BootstrapStateInitialProcess, targetCwd: string ) { const { childScriptArgs, childScriptPath, nodeExecArgs } = getChildProcessArguments(/* enableEsmLoader */ true, state); - childScriptArgs.push(...state.parseArgvResult.restArgs); + childScriptArgs.push(...state.restArgs); const child = fork(childScriptPath, childScriptArgs, { stdio: 'inherit',