import fs from "node:fs/promises";
import os from "node:os";
import path from "node:path";
import { pathToFileURL } from "node:url";
import { deriveSkynetCausalLabelCounts } from "../causal-valence/episode-ledger.js";
import { collectSkynetSessionTranscriptFiles } from "../causal-valence/observability-audit.js";
import { harvestSkynetObservedCausalEpisodes } from "../causal-valence/observed-harvester.js";
import { replaySkynetCognitiveKernelState } from "../cognitive-kernel/min-kernel.js";
import { runSkynetCognitiveKernelBenchmark } from "../cognitive-kernel/online-benchmark.js";
import { writeSkynetCognitiveKernelState } from "../cognitive-kernel/state-store.js";
import { buildSkynetRuntimeTrajectorySamples } from "../runtime-observer/trajectory-builder.js";
/**
 * Outcome of one Cognitive Kernel 01 experiment run: everything returned by
 * `runSkynetCognitiveKernelBenchmark`, intersected with the run metadata that
 * `runSkynetCognitiveKernel01` attaches before persisting the report.
 */
export type SkynetCognitiveKernel01Result = ReturnType<typeof runSkynetCognitiveKernelBenchmark> & {
/** Session key exactly as supplied by the caller (not the sanitized file-name form). */
sessionKey: string;
/** `Date.now()` value captured when the result object was assembled. */
updatedAt: number;
/** Display name printed in the CLI banner; the runner sets it to "Skynet". */
projectName: string;
/** Number of episodes returned by the observed-episode harvester. */
harvestedEpisodes: number;
/** Number of trajectory samples built from the harvested episodes. */
trajectorySamples: number;
/** Lookback passed to the trajectory builder, after clamping to the range 1..6. */
lookback: number;
/** Session transcript files that were collected and handed to the harvester. */
scannedSessionFiles: string[];
/** Label counts derived from the harvested episodes via `deriveSkynetCausalLabelCounts`. */
sourceLabelCoverage: ReturnType<typeof deriveSkynetCausalLabelCounts>;
};
/**
 * Converts an arbitrary session key into a token that is safe to embed in a file name.
 *
 * Surrounding whitespace is trimmed, each run of characters outside
 * `[a-zA-Z0-9._-]` collapses into a single underscore, and the result is cut
 * to at most 64 characters. A blank key (or an empty result) yields "main".
 */
function sanitizeSessionKey(sessionKey: string): string {
  const trimmed = sessionKey.trim();
  const base = trimmed.length > 0 ? trimmed : "main";
  const safe = base.replace(/[^a-zA-Z0-9._-]+/g, "_").slice(0, 64);
  return safe.length > 0 ? safe : "main";
}
/**
 * Sessions directory used when the caller does not supply one:
 * `<home>/.openskynet/agents/main/sessions`, where `<home>` is `os.homedir()`.
 */
function defaultSessionsDir(): string {
  const segments = [".openskynet", "agents", "main", "sessions"];
  return path.join(os.homedir(), ...segments);
}
/**
 * Computes where the JSON report for a session is stored:
 * `<workspaceRoot>/.openskynet/skynet-experiments/<sanitized key>-cognitive-kernel-01.json`.
 *
 * @param params.workspaceRoot - Directory under which the `.openskynet` folder lives.
 * @param params.sessionKey - Raw session key; it is sanitized before being used in the file name.
 * @returns The report path, assembled with `path.join`.
 */
export function resolveSkynetCognitiveKernel01JsonPath(params: {
  workspaceRoot: string;
  sessionKey: string;
}): string {
  const { workspaceRoot, sessionKey } = params;
  const fileName = `${sanitizeSessionKey(sessionKey)}-cognitive-kernel-01.json`;
  const experimentsDir = path.join(workspaceRoot, ".openskynet", "skynet-experiments");
  return path.join(experimentsDir, fileName);
}
/**
 * Computes where the Markdown summary is stored:
 * `<workspaceRoot>/memory/SKYNET_EXPERIMENT_COGNITIVE_KERNEL_01.md`.
 *
 * @param workspaceRoot - Directory that contains (or will contain) the `memory` folder.
 * @returns The summary path, assembled with `path.join`.
 */
export function resolveSkynetCognitiveKernel01MarkdownPath(workspaceRoot: string): string {
  const reportFileName = "SKYNET_EXPERIMENT_COGNITIVE_KERNEL_01.md";
  return path.join(workspaceRoot, "memory", reportFileName);
}
/**
 * Renders an experiment result as a Markdown document.
 *
 * The document has a title, a block of "Key: value" summary lines, and three
 * bullet-list sections: source label coverage, trajectory label coverage and
 * failure reasons ("- none" when the list is empty). Lines are joined with
 * "\n" and the text ends with a trailing newline.
 *
 * @param result - The experiment result to summarise.
 * @returns The Markdown text.
 */
function buildMarkdown(result: SkynetCognitiveKernel01Result): string {
  const lines: string[] = ["# SKYNET Experiment - Cognitive Kernel 01", ""];

  // Summary header, in the same order the values are reported.
  lines.push(`Updated: ${new Date(result.updatedAt).toISOString()}`);
  lines.push(`Session: ${result.sessionKey}`);
  lines.push(`Status: ${result.status}`);
  lines.push(`Harvested episodes: ${result.harvestedEpisodes}`);
  lines.push(`Trajectory samples: ${result.trajectorySamples}`);
  lines.push(`Lookback: ${result.lookback}`);
  lines.push(`Warmup samples: ${result.warmupSamples}`);
  lines.push(`Accuracy: ${result.accuracy.toFixed(2)}`);
  lines.push(`Sequential majority baseline: ${result.majorityBaseline.toFixed(2)}`);
  lines.push(`Improvement: ${result.improvementOverBaseline.toFixed(2)}`);
  lines.push("");

  lines.push("## Source Label Coverage", "");
  for (const [label, count] of Object.entries(result.sourceLabelCoverage)) {
    lines.push(`- ${label}: ${count}`);
  }
  lines.push("");

  lines.push("## Trajectory Label Coverage", "");
  for (const [label, count] of Object.entries(result.labelCoverage)) {
    lines.push(`- ${label}: ${count}`);
  }
  lines.push("");

  lines.push("## Failure Reasons", "");
  if (result.failureReasons.length > 0) {
    for (const reason of result.failureReasons) {
      lines.push(`- ${reason}`);
    }
  } else {
    lines.push("- none");
  }

  // The final empty entry makes the joined text end with a newline.
  lines.push("");
  return lines.join("\n");
}
/**
 * Runs the Cognitive Kernel 01 experiment end to end and persists its outputs.
 *
 * Steps, in order:
 * 1. Collect session transcript files from `params.sessionsDir` (or the default sessions directory).
 * 2. Harvest observed causal episodes from those files.
 * 3. Build trajectory samples with the clamped lookback and run the kernel benchmark on them.
 * 4. Write the result as pretty-printed JSON and as a Markdown summary, creating parent directories.
 * 5. Replay the kernel state from the samples and, if a state is returned, store it for the session.
 *
 * @param params.workspaceRoot - Root directory for the JSON report, the Markdown summary and the kernel state.
 * @param params.sessionKey - Session key recorded in the result and used to name the JSON report.
 * @param params.lookback - Requested lookback; clamped to 1..6. Defaults to 3 when omitted or `NaN`.
 * @param params.sessionsDir - Directory to scan for transcripts; defaults to the per-user sessions directory.
 * @returns The benchmark output merged with the run metadata.
 */
export async function runSkynetCognitiveKernel01(params: {
  workspaceRoot: string;
  sessionKey: string;
  lookback?: number;
  sessionsDir?: string;
}): Promise<SkynetCognitiveKernel01Result> {
  // `??` only replaces null/undefined, and Math.min/Math.max propagate NaN, so a
  // NaN lookback would otherwise bypass the clamp, reach the trajectory builder
  // and be serialised as `null` in the JSON report. Treat it as "not provided".
  const defaultLookback = 3;
  const requestedLookback = params.lookback ?? defaultLookback;
  const lookback = Math.max(
    1,
    Math.min(6, Number.isNaN(requestedLookback) ? defaultLookback : requestedLookback),
  );

  const sessionFiles = await collectSkynetSessionTranscriptFiles(
    params.sessionsDir ?? defaultSessionsDir(),
  );
  const harvested = await harvestSkynetObservedCausalEpisodes({ sessionFiles });
  const trajectorySamples = buildSkynetRuntimeTrajectorySamples({
    episodes: harvested.episodes,
    lookback,
  });
  const benchmark = runSkynetCognitiveKernelBenchmark({ samples: trajectorySamples });

  // The benchmark fields are spread last, so they win over any same-named metadata key.
  const result: SkynetCognitiveKernel01Result = {
    sessionKey: params.sessionKey,
    updatedAt: Date.now(),
    projectName: "Skynet",
    harvestedEpisodes: harvested.episodes.length,
    trajectorySamples: trajectorySamples.length,
    lookback,
    scannedSessionFiles: sessionFiles,
    sourceLabelCoverage: deriveSkynetCausalLabelCounts(harvested.episodes),
    ...benchmark,
  };

  const jsonPath = resolveSkynetCognitiveKernel01JsonPath(params);
  const markdownPath = resolveSkynetCognitiveKernel01MarkdownPath(params.workspaceRoot);
  await fs.mkdir(path.dirname(jsonPath), { recursive: true });
  await fs.mkdir(path.dirname(markdownPath), { recursive: true });
  await fs.writeFile(jsonPath, JSON.stringify(result, null, 2) + "\n", "utf-8");
  await fs.writeFile(markdownPath, buildMarkdown(result), "utf-8");

  // The kernel state is only stored when the replay returns a truthy state.
  const state = replaySkynetCognitiveKernelState({ samples: trajectorySamples });
  if (state) {
    await writeSkynetCognitiveKernelState({
      workspaceRoot: params.workspaceRoot,
      sessionKey: params.sessionKey,
      state,
    });
  }
  return result;
}
/**
 * CLI entry point: runs the experiment against the current working directory
 * with the fixed session key "agent:openskynet:main" and prints a short
 * summary (status, sample count, accuracy, baseline) to stdout.
 */
async function main() {
  const sessionKey = "agent:openskynet:main";
  const workspaceRoot = process.cwd();
  const outcome = await runSkynetCognitiveKernel01({ workspaceRoot, sessionKey });

  console.log(`--- ${outcome.projectName} Experiment: Cognitive Kernel 01 ---`);
  console.log(`Status: ${outcome.status}`);
  console.log(`Samples: ${outcome.trajectorySamples}`);
  console.log(`Accuracy: ${outcome.accuracy.toFixed(2)}`);
  console.log(`Baseline: ${outcome.majorityBaseline.toFixed(2)}`);
}
// Run the experiment only when this module is the script Node was started
// with: the file URL of argv[1] must equal this module's own URL. A failure
// is logged and reported through a non-zero exit code.
if (process.argv[1]) {
  if (pathToFileURL(process.argv[1]).href === import.meta.url) {
    main().catch((failure) => {
      console.error(failure);
      process.exitCode = 1;
    });
  }
}
|