From b92e77c2b8548aee7a2186849cebe691181b47e7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Philippe=20Rivi=C3=A8re?= Date: Mon, 16 Sep 2024 17:18:13 +0200 Subject: [PATCH] a $FILE_SERVER that tracks dependencies in the cache --- src/fileWatchers.ts | 74 ++++++++------ src/loader.ts | 97 ++++++++++++++++--- src/preview.ts | 8 +- test/input/build/chain/chain-source.json.sh | 1 + test/input/build/chain/chain.json.ts | 1 + test/input/build/chain/chain.md | 9 ++ test/input/build/chain/chain1.json.ts | 3 + test/input/build/chain/chain2.csv.ts | 3 + .../build/chain/_file/chain1.550fb08c.json | 4 + .../build/chain/_file/chain2.b1220d22.csv | 3 + .../build/chain/_npm/d3-dsv@3.0.1/cd372fb8.js | 0 .../chain/_observablehq/client.00000001.js | 0 .../chain/_observablehq/runtime.00000002.js | 0 .../chain/_observablehq/stdlib.00000003.js | 0 .../theme-air,near-midnight.00000004.css | 0 test/output/build/chain/chain.html | 61 ++++++++++++ 16 files changed, 221 insertions(+), 43 deletions(-) create mode 100644 test/input/build/chain/chain-source.json.sh create mode 100644 test/input/build/chain/chain.json.ts create mode 100644 test/input/build/chain/chain.md create mode 100644 test/input/build/chain/chain1.json.ts create mode 100644 test/input/build/chain/chain2.csv.ts create mode 100644 test/output/build/chain/_file/chain1.550fb08c.json create mode 100644 test/output/build/chain/_file/chain2.b1220d22.csv create mode 100644 test/output/build/chain/_npm/d3-dsv@3.0.1/cd372fb8.js create mode 100644 test/output/build/chain/_observablehq/client.00000001.js create mode 100644 test/output/build/chain/_observablehq/runtime.00000002.js create mode 100644 test/output/build/chain/_observablehq/stdlib.00000003.js create mode 100644 test/output/build/chain/_observablehq/theme-air,near-midnight.00000004.css create mode 100644 test/output/build/chain/chain.html diff --git a/src/fileWatchers.ts b/src/fileWatchers.ts index c1dcdf15e..63b8dc02b 100644 --- a/src/fileWatchers.ts +++ b/src/fileWatchers.ts @@ -1,5 +1,6 @@ import type {FSWatcher} from "node:fs"; -import {watch} from "node:fs"; +import {readFileSync, watch} from "node:fs"; +import {join} from "node:path/posix"; import {isEnoent} from "./error.js"; import {maybeStat} from "./files.js"; import type {LoaderResolver} from "./loader.js"; @@ -11,38 +12,55 @@ export class FileWatchers { static async of(loaders: LoaderResolver, path: string, names: Iterable, callback: (name: string) => void) { const that = new FileWatchers(); const {watchers} = that; + const {root} = loaders; for (const name of names) { - const watchPath = loaders.getWatchPath(resolvePath(path, name)); - if (!watchPath) continue; - let currentStat = await maybeStat(watchPath); - let watcher: FSWatcher; - const index = watchers.length; + const path0 = resolvePath(path, name); + const paths = new Set([path0]); try { - watcher = watch(watchPath, async function watched(type) { - // Re-initialize the watcher on the original path on rename. - if (type === "rename") { - watcher.close(); - try { - watcher = watchers[index] = watch(watchPath, watched); - } catch (error) { - if (!isEnoent(error)) throw error; - console.error(`file no longer exists: ${watchPath}`); + for (const path of JSON.parse( + readFileSync(join(root, ".observablehq", "cache", `${path0}__dependencies`), "utf-8") + )) + paths.add(path); + } catch (error) { + if (!isEnoent(error)) { + throw error; + } + } + + for (const path of paths) { + const watchPath = loaders.getWatchPath(path); + if (!watchPath) continue; + console.warn(watchPath, name); + let currentStat = await maybeStat(watchPath); + let watcher: FSWatcher; + const index = watchers.length; + try { + watcher = watch(watchPath, async function watched(type) { + // Re-initialize the watcher on the original path on rename. + if (type === "rename") { + watcher.close(); + try { + watcher = watchers[index] = watch(watchPath, watched); + } catch (error) { + if (!isEnoent(error)) throw error; + console.error(`file no longer exists: ${watchPath}`); + return; + } + setTimeout(() => watched("change"), 100); // delay to avoid a possibly-empty file return; } - setTimeout(() => watched("change"), 100); // delay to avoid a possibly-empty file - return; - } - const newStat = await maybeStat(watchPath); - // Ignore if the file was truncated or not modified. - if (currentStat?.mtimeMs === newStat?.mtimeMs || newStat?.size === 0) return; - currentStat = newStat; - callback(name); - }); - } catch (error) { - if (!isEnoent(error)) throw error; - continue; + const newStat = await maybeStat(watchPath); + // Ignore if the file was truncated or not modified. + if (currentStat?.mtimeMs === newStat?.mtimeMs || newStat?.size === 0) return; + currentStat = newStat; + callback(name); + }); + } catch (error) { + if (!isEnoent(error)) throw error; + continue; + } + watchers[index] = watcher; } - watchers[index] = watcher; } return that; } diff --git a/src/loader.ts b/src/loader.ts index 43be87896..8b6c99b1c 100644 --- a/src/loader.ts +++ b/src/loader.ts @@ -1,13 +1,13 @@ import {createHash} from "node:crypto"; import type {FSWatcher, WatchListener, WriteStream} from "node:fs"; -import {createReadStream, existsSync, statSync, watch} from "node:fs"; -import {open, readFile, rename, unlink} from "node:fs/promises"; +import {createReadStream, existsSync, readFileSync, statSync, watch} from "node:fs"; +import {open, readFile, rename, rm, unlink, writeFile} from "node:fs/promises"; import {dirname, extname, join} from "node:path/posix"; import {createGunzip} from "node:zlib"; import {spawn} from "cross-spawn"; import JSZip from "jszip"; import {extract} from "tar-stream"; -import {enoent} from "./error.js"; +import {enoent, isEnoent} from "./error.js"; import {maybeStat, prepareOutput, visitFiles} from "./files.js"; import {FileWatchers} from "./fileWatchers.js"; import {formatByteSize} from "./format.js"; @@ -16,6 +16,7 @@ import {findModule, getFileInfo} from "./javascript/module.js"; import type {Logger, Writer} from "./logger.js"; import type {MarkdownPage, ParseOptions} from "./markdown.js"; import {parseMarkdown} from "./markdown.js"; +import {preview} from "./preview.js"; import type {Params} from "./route.js"; import {isParameterized, requote, route} from "./route.js"; import {cyan, faint, green, red, yellow} from "./tty.js"; @@ -50,6 +51,9 @@ const defaultEffects: LoadEffects = { export interface LoadOptions { /** Whether to use a stale cache; true when building. */ useStale?: boolean; + + /** An asset server for chained data loaders. */ + FILE_SERVER?: string; } export interface LoaderOptions { @@ -60,7 +64,7 @@ export interface LoaderOptions { } export class LoaderResolver { - private readonly root: string; + readonly root: string; private readonly interpreters: Map; constructor({root, interpreters}: {root: string; interpreters?: Record}) { @@ -303,7 +307,21 @@ export class LoaderResolver { const info = getFileInfo(this.root, path); if (!info) return createHash("sha256").digest("hex"); const {hash} = info; - return path === name ? hash : createHash("sha256").update(hash).update(String(info.mtimeMs)).digest("hex"); + if (path === name) return hash; + const hash2 = createHash("sha256").update(hash).update(String(info.mtimeMs)); + try { + for (const path of JSON.parse( + readFileSync(join(this.root, ".observablehq", "cache", `${name}__dependencies`), "utf-8") + )) { + const info = getFileInfo(this.root, this.getSourceFilePath(path)); + if (info) hash2.update(info.hash).update(String(info.mtimeMs)); + } + } catch (error) { + if (!isEnoent(error)) { + throw error; + } + } + return hash2.digest("hex"); } getSourceInfo(name: string): FileInfo | undefined { @@ -394,12 +412,37 @@ abstract class AbstractLoader implements Loader { const outputPath = join(".observablehq", "cache", this.targetPath); const cachePath = join(this.root, outputPath); const loaderStat = await maybeStat(loaderPath); - const cacheStat = await maybeStat(cachePath); - if (!cacheStat) effects.output.write(faint("[missing] ")); - else if (cacheStat.mtimeMs < loaderStat!.mtimeMs) { - if (useStale) return effects.output.write(faint("[using stale] ")), outputPath; - else effects.output.write(faint("[stale] ")); - } else return effects.output.write(faint("[fresh] ")), outputPath; + const paths = new Set([cachePath]); + try { + for (const path of JSON.parse(await readFile(`${cachePath}__dependencies`, "utf-8"))) paths.add(path); + } catch (error) { + if (!isEnoent(error)) { + throw error; + } + } + + const FRESH = 0; + const STALE = 1; + const MISSING = 2; + let status = FRESH; + for (const path of paths) { + const cacheStat = await maybeStat(path); + if (!cacheStat) { + status = MISSING; + break; + } else if (cacheStat.mtimeMs < loaderStat!.mtimeMs) status = Math.max(status, STALE); + } + switch (status) { + case FRESH: + return effects.output.write(faint("[fresh] ")), outputPath; + case STALE: + if (useStale) return effects.output.write(faint("[using stale] ")), outputPath; + effects.output.write(faint("[stale] ")); + break; + case MISSING: + effects.output.write(faint("[missing] ")); + break; + } const tempPath = join(this.root, ".observablehq", "cache", `${this.targetPath}.${process.pid}`); const errorPath = tempPath + ".err"; const errorStat = await maybeStat(errorPath); @@ -411,8 +454,17 @@ abstract class AbstractLoader implements Loader { await prepareOutput(tempPath); await prepareOutput(cachePath); const tempFd = await open(tempPath, "w"); + + // Launch a server for chained data loaders. TODO configure host? + const dependencies = new Set(); + const {server} = await preview({root: this.root, verbose: false, hostname: "127.0.0.1", dependencies}); + const address = server.address(); + if (!address || typeof address !== "object") + throw new Error("Couldn't launch server for chained data loaders!"); + const FILE_SERVER = `http://${address.address}:${address.port}/_file/`; + try { - await this.exec(tempFd.createWriteStream({highWaterMark: 1024 * 1024}), {useStale}, effects); + await this.exec(tempFd.createWriteStream({highWaterMark: 1024 * 1024}), {useStale, FILE_SERVER}, effects); await rename(tempPath, cachePath); } catch (error) { await rename(tempPath, errorPath); @@ -420,6 +472,19 @@ abstract class AbstractLoader implements Loader { } finally { await tempFd.close(); } + + const cachedeps = `${cachePath}__dependencies`; + if (dependencies.size) await writeFile(cachedeps, JSON.stringify([...dependencies]), "utf-8"); + else + try { + await rm(cachedeps); + } catch (error) { + if (!isEnoent(error)) throw error; + } + + // TODO: server.close() might be enough? + await new Promise((closed) => server.close(closed)); + return outputPath; })(); command.finally(() => runningCommands.delete(key)).catch(() => {}); @@ -472,8 +537,12 @@ class CommandLoader extends AbstractLoader { this.args = args; } - async exec(output: WriteStream): Promise { - const subprocess = spawn(this.command, this.args, {windowsHide: true, stdio: ["ignore", output, "inherit"]}); + async exec(output: WriteStream, {FILE_SERVER}): Promise { + const subprocess = spawn(this.command, this.args, { + windowsHide: true, + stdio: ["ignore", output, "inherit"], + env: {...process.env, FILE_SERVER} + }); const code = await new Promise((resolve, reject) => { subprocess.on("error", reject); subprocess.on("close", resolve); diff --git a/src/preview.ts b/src/preview.ts index e458d9b02..3c59db234 100644 --- a/src/preview.ts +++ b/src/preview.ts @@ -45,6 +45,7 @@ export interface PreviewOptions { port?: number; origins?: string[]; verbose?: boolean; + dependencies?: Set; } export async function preview(options: PreviewOptions): Promise { @@ -58,19 +59,22 @@ export class PreviewServer { private readonly _server: ReturnType; private readonly _socketServer: WebSocketServer; private readonly _verbose: boolean; + private readonly dependencies: Set | undefined; private constructor({ config, root, origins = [], server, - verbose + verbose, + dependencies }: { config?: string; root?: string; origins?: string[]; server: Server; verbose: boolean; + dependencies?: Set; }) { this._config = config; this._root = root; @@ -80,6 +84,7 @@ export class PreviewServer { this._server.on("request", this._handleRequest); this._socketServer = new WebSocketServer({server: this._server}); this._socketServer.on("connection", this._handleConnection); + this.dependencies = dependencies; } static async start({verbose = true, hostname, port, open, ...options}: PreviewOptions) { @@ -171,6 +176,7 @@ export class PreviewServer { } throw enoent(path); } else if (pathname.startsWith("/_file/")) { + if (this.dependencies) this.dependencies.add(pathname.slice("/_file".length)); send(req, await loaders.loadFile(pathname.slice("/_file".length)), {root}).pipe(res); } else { if ((pathname = normalize(pathname)).startsWith("..")) throw new Error("Invalid path: " + pathname); diff --git a/test/input/build/chain/chain-source.json.sh b/test/input/build/chain/chain-source.json.sh new file mode 100644 index 000000000..3d99dd10c --- /dev/null +++ b/test/input/build/chain/chain-source.json.sh @@ -0,0 +1 @@ +echo '{"x": 3}' diff --git a/test/input/build/chain/chain.json.ts b/test/input/build/chain/chain.json.ts new file mode 100644 index 000000000..911822172 --- /dev/null +++ b/test/input/build/chain/chain.json.ts @@ -0,0 +1 @@ +console.log(JSON.stringify(process.env.address, null, 2)); \ No newline at end of file diff --git a/test/input/build/chain/chain.md b/test/input/build/chain/chain.md new file mode 100644 index 000000000..2356a792e --- /dev/null +++ b/test/input/build/chain/chain.md @@ -0,0 +1,9 @@ +# Chained data loaders + +```js +FileAttachment("chain1.json").json() +``` + +```js +FileAttachment("chain2.csv").csv({typed: true}) +``` diff --git a/test/input/build/chain/chain1.json.ts b/test/input/build/chain/chain1.json.ts new file mode 100644 index 000000000..37a628bcf --- /dev/null +++ b/test/input/build/chain/chain1.json.ts @@ -0,0 +1,3 @@ +const {FILE_SERVER} = process.env; +const {x} = await fetch(`${FILE_SERVER}chain-source.json`).then((response) => response.json()); +console.log(JSON.stringify({x, "x^2": x * x}, null, 2)); diff --git a/test/input/build/chain/chain2.csv.ts b/test/input/build/chain/chain2.csv.ts new file mode 100644 index 000000000..7c428b0c6 --- /dev/null +++ b/test/input/build/chain/chain2.csv.ts @@ -0,0 +1,3 @@ +const {FILE_SERVER} = process.env; +const {x} = await fetch(`${FILE_SERVER}chain-source.json`).then((response) => response.json()); +console.log(`name,value\nx,${x}\nx^2,${x * x}`); diff --git a/test/output/build/chain/_file/chain1.550fb08c.json b/test/output/build/chain/_file/chain1.550fb08c.json new file mode 100644 index 000000000..82cebd520 --- /dev/null +++ b/test/output/build/chain/_file/chain1.550fb08c.json @@ -0,0 +1,4 @@ +{ + "x": 3, + "x^2": 9 +} diff --git a/test/output/build/chain/_file/chain2.b1220d22.csv b/test/output/build/chain/_file/chain2.b1220d22.csv new file mode 100644 index 000000000..8d5b044f1 --- /dev/null +++ b/test/output/build/chain/_file/chain2.b1220d22.csv @@ -0,0 +1,3 @@ +name,value +x,3 +x^2,9 diff --git a/test/output/build/chain/_npm/d3-dsv@3.0.1/cd372fb8.js b/test/output/build/chain/_npm/d3-dsv@3.0.1/cd372fb8.js new file mode 100644 index 000000000..e69de29bb diff --git a/test/output/build/chain/_observablehq/client.00000001.js b/test/output/build/chain/_observablehq/client.00000001.js new file mode 100644 index 000000000..e69de29bb diff --git a/test/output/build/chain/_observablehq/runtime.00000002.js b/test/output/build/chain/_observablehq/runtime.00000002.js new file mode 100644 index 000000000..e69de29bb diff --git a/test/output/build/chain/_observablehq/stdlib.00000003.js b/test/output/build/chain/_observablehq/stdlib.00000003.js new file mode 100644 index 000000000..e69de29bb diff --git a/test/output/build/chain/_observablehq/theme-air,near-midnight.00000004.css b/test/output/build/chain/_observablehq/theme-air,near-midnight.00000004.css new file mode 100644 index 000000000..e69de29bb diff --git a/test/output/build/chain/chain.html b/test/output/build/chain/chain.html new file mode 100644 index 000000000..c276e2158 --- /dev/null +++ b/test/output/build/chain/chain.html @@ -0,0 +1,61 @@ + + + + +Chained data loaders + + + + + + + + + + + + + + + +
+
+

Chained data loaders

+
+
+
+ +