Files
moltbot/src/plugins/document-extractors.runtime.ts
Vincent Koc e3cba98f39 refactor(pdf): move document extraction to plugin
* refactor(pdf): move document extraction to plugin

* fix(deps): sync document extract lockfile

* fix(pdf): harden document extraction plugin
2026-04-24 17:15:05 -07:00

135 lines
4.4 KiB
TypeScript

import type { OpenClawConfig } from "../config/types.openclaw.js";
import { resolveBundledPluginCompatibleLoadValues } from "./activation-context.js";
import {
createPluginActivationSource,
normalizePluginsConfig,
resolveEffectivePluginActivationState,
} from "./config-state.js";
import { loadBundledDocumentExtractorEntriesFromDir } from "./document-extractor-public-artifacts.js";
import type { PluginDocumentExtractorEntry } from "./document-extractor-types.js";
import { loadPluginManifestRegistry } from "./manifest-registry.js";
import type { PluginManifestRecord } from "./manifest-registry.js";
/**
 * Sort comparator for document extractor entries.
 *
 * Entries are ordered by ascending `autoDetectOrder`; an entry without an
 * `autoDetectOrder` is ranked as `Number.MAX_SAFE_INTEGER`, which places it
 * after entries with smaller explicit orders. Entries with the same rank are
 * ordered by `id`, then by `pluginId`, both compared with `localeCompare`.
 *
 * @param left - First entry to compare.
 * @param right - Second entry to compare.
 * @returns A negative number when `left` sorts first, a positive number when
 *   `right` sorts first, and `0` when all three keys are equal.
 */
function compareExtractors(
  left: PluginDocumentExtractorEntry,
  right: PluginDocumentExtractorEntry,
): number {
  const rankOf = (entry: PluginDocumentExtractorEntry): number =>
    entry.autoDetectOrder ?? Number.MAX_SAFE_INTEGER;
  const leftRank = rankOf(left);
  const rightRank = rankOf(right);
  if (leftRank === rightRank) {
    // Same rank: fall back to the identifiers so the ordering stays stable.
    const byId = left.id.localeCompare(right.id);
    return byId !== 0 ? byId : left.pluginId.localeCompare(right.pluginId);
  }
  return leftRank - rightRank;
}
/**
 * Lists the ids of bundled plugins that declare document extractors.
 *
 * The manifest registry is loaded for the given config/workspace/env, and a
 * plugin id is kept when the plugin's `origin` is `"bundled"` and its
 * `contracts.documentExtractors` list has at least one entry.
 *
 * @param params.config - Config passed through to the manifest registry loader.
 * @param params.workspaceDir - Workspace directory passed through to the loader.
 * @param params.env - Environment passed through to the loader.
 * @param params.onlyPluginIds - Optional restriction to these plugin ids; a
 *   missing or empty list applies no restriction.
 * @returns The matching plugin ids, sorted with `localeCompare`.
 */
function resolveBundledDocumentExtractorCompatPluginIds(params: {
  config?: OpenClawConfig;
  workspaceDir?: string;
  env?: NodeJS.ProcessEnv;
  onlyPluginIds?: readonly string[];
}): string[] {
  const requestedIds = params.onlyPluginIds ?? [];
  const allowedIds = requestedIds.length > 0 ? new Set(requestedIds) : null;
  const registry = loadPluginManifestRegistry({
    config: params.config,
    workspaceDir: params.workspaceDir,
    env: params.env,
  });
  const matchingIds: string[] = [];
  for (const plugin of registry.plugins) {
    if (plugin.origin !== "bundled") {
      continue;
    }
    if (allowedIds !== null && !allowedIds.has(plugin.id)) {
      continue;
    }
    const declaredExtractorCount = plugin.contracts?.documentExtractors?.length ?? 0;
    if (declaredExtractorCount > 0) {
      matchingIds.push(plugin.id);
    }
  }
  return matchingIds.toSorted((a, b) => a.localeCompare(b));
}
/**
 * Resolves the manifest records of bundled document-extractor plugins that
 * are currently enabled.
 *
 * Returns an empty list immediately when `config.plugins.enabled` is `false`.
 * Otherwise the config is first passed through
 * `resolveBundledPluginCompatibleLoadValues` (with auto-enable on and
 * `resolveBundledDocumentExtractorCompatPluginIds` supplying the compat plugin
 * ids), and the resulting config is used both to load the manifest registry
 * and to evaluate each candidate's activation state.
 *
 * A plugin is kept when its `origin` is `"bundled"`, it is not excluded by
 * `onlyPluginIds`, it declares at least one `contracts.documentExtractors`
 * entry, and `resolveEffectivePluginActivationState` reports it as enabled.
 *
 * @param params.config - Raw config to resolve activation from.
 * @param params.workspaceDir - Workspace directory passed to the helpers.
 * @param params.env - Environment passed to the helpers.
 * @param params.onlyPluginIds - Optional restriction to these plugin ids; a
 *   missing or empty list applies no restriction in the local filter.
 * @returns The enabled plugin manifest records, in registry order.
 */
function resolveEnabledBundledDocumentExtractorPlugins(params: {
  config?: OpenClawConfig;
  workspaceDir?: string;
  env?: NodeJS.ProcessEnv;
  onlyPluginIds?: readonly string[];
}): PluginManifestRecord[] {
  const { config, workspaceDir, env, onlyPluginIds } = params;
  // Plugins switched off globally: nothing can be enabled.
  if (config?.plugins?.enabled === false) {
    return [];
  }

  const activation = resolveBundledPluginCompatibleLoadValues({
    rawConfig: config,
    env,
    workspaceDir,
    onlyPluginIds,
    applyAutoEnable: true,
    compatMode: {
      allowlist: false,
      enablement: "allowlist",
      vitest: true,
    },
    resolveCompatPluginIds: resolveBundledDocumentExtractorCompatPluginIds,
  });
  const pluginsConfig = normalizePluginsConfig(activation.config?.plugins);
  const activationSource = createPluginActivationSource({
    config: activation.activationSourceConfig,
  });
  const allowedIds = onlyPluginIds && onlyPluginIds.length > 0 ? new Set(onlyPluginIds) : null;

  const registry = loadPluginManifestRegistry({
    config: activation.config,
    workspaceDir,
    env,
  });
  const enabledPlugins: PluginManifestRecord[] = [];
  for (const plugin of registry.plugins) {
    if (plugin.origin !== "bundled") {
      continue;
    }
    if (allowedIds !== null && !allowedIds.has(plugin.id)) {
      continue;
    }
    if ((plugin.contracts?.documentExtractors?.length ?? 0) === 0) {
      continue;
    }
    // Only candidates that passed the cheap checks reach activation resolution.
    const state = resolveEffectivePluginActivationState({
      id: plugin.id,
      origin: plugin.origin,
      config: pluginsConfig,
      rootConfig: activation.config,
      enabledByDefault: plugin.enabledByDefault,
      activationSource,
    });
    if (state.enabled) {
      enabledPlugins.push(plugin);
    }
  }
  return enabledPlugins;
}
/**
 * Loads the document extractor entries of every enabled bundled plugin and
 * returns them sorted with `compareExtractors`.
 *
 * Each plugin is loaded independently via
 * `loadBundledDocumentExtractorEntriesFromDir`, using the plugin id as both
 * the directory name and the plugin id. An exception thrown while loading one
 * plugin is recorded and the remaining plugins are still attempted. Recorded
 * failures are only surfaced when no extractor at all could be loaded.
 *
 * @param params.config - Config used to decide which plugins are enabled.
 * @param params.workspaceDir - Workspace directory passed to plugin resolution.
 * @param params.env - Environment passed to plugin resolution.
 * @param params.onlyPluginIds - Optional restriction to these plugin ids.
 * @returns The loaded extractor entries in sorted order; empty when no plugin
 *   contributed entries and no load failed.
 * @throws Error "Unable to load document extractor plugins" when no extractor
 *   was loaded and at least one load threw. `cause` is the single underlying
 *   error, or an `AggregateError` wrapping all of them when there are several.
 */
export function resolvePluginDocumentExtractors(params?: {
  config?: OpenClawConfig;
  workspaceDir?: string;
  env?: NodeJS.ProcessEnv;
  onlyPluginIds?: readonly string[];
}): PluginDocumentExtractorEntry[] {
  const enabledPlugins = resolveEnabledBundledDocumentExtractorPlugins({
    config: params?.config,
    workspaceDir: params?.workspaceDir,
    env: params?.env,
    onlyPluginIds: params?.onlyPluginIds,
  });

  const collected: PluginDocumentExtractorEntry[] = [];
  const failures: unknown[] = [];

  // Load one plugin's entries, recording (not rethrowing) any load failure.
  const tryLoad = (plugin: PluginManifestRecord): PluginDocumentExtractorEntry[] | null => {
    try {
      return loadBundledDocumentExtractorEntriesFromDir({
        dirName: plugin.id,
        pluginId: plugin.id,
      });
    } catch (failure) {
      failures.push(failure);
      return null;
    }
  };

  for (const plugin of enabledPlugins) {
    const entries = tryLoad(plugin);
    if (entries) {
      collected.push(...entries);
    }
  }

  if (collected.length > 0 || failures.length === 0) {
    return collected.toSorted(compareExtractors);
  }

  // Nothing loaded and at least one plugin failed: report the failure(s).
  const cause = failures.length === 1 ? failures[0] : new AggregateError(failures);
  throw new Error("Unable to load document extractor plugins", { cause });
}