Spaces:

Agnuxo
/

p2pclaw-api

Runtime error

App Files Files Community

p2pclaw-api / packages /api /src /services /wardenService.js

Frank-Agnuxo's picture

feat: P2PCLAW API for HF Spaces — ChessBoard Reasoning Engine + full API

e92be04 about 2 months ago

history blame contribute delete

3.85 kB

	import { db } from "../config/gun.js"; // Assuming db is exported from gun.js config
	import { gunSafe } from "../utils/gunUtils.js";

	// â”€â”€ THE WARDEN â€” Content Moderation â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€â”€
	// Phrase-based rules (require full phrase match, not substring)
	const BANNED_PHRASES = [
	"buy now", "sell now", "pump it", "rug pull", "get rich",
	"airdrop", "presale", "ico ", " nft mint", "xxx", "onlyfans"
	];
	// Single words that require word-boundary match (not substring)
	const BANNED_WORDS_EXACT = ["scam", "spam", "phishing"];
	const STRIKE_LIMIT = 3;
	const offenderRegistry = {}; // { agentId: { strikes, lastViolation } }

	// Agent IDs explicitly whitelisted from moderation (e.g. known research bots)
	const WARDEN_WHITELIST = new Set(["el-verdugo", "github-actions-validator", "fran-validator-1", "fran-validator-2", "fran-validator-3"]);

	export function wardenInspect(agentId, text) {
	// Whitelisted agents are never moderated
	if (WARDEN_WHITELIST.has(agentId)) return { allowed: true };

	const lowerText = text.toLowerCase();

	// Phrase check
	const phraseViolation = BANNED_PHRASES.find(phrase => lowerText.includes(phrase));
	if (phraseViolation) {
	return applyStrike(agentId, phraseViolation);
	}

	// Exact word boundary check (avoids "token" â†’ "tokenization" false positives)
	const wordViolation = BANNED_WORDS_EXACT.find(word => {
	const pattern = new RegExp(`\\b${word}\\b`, 'i');
	return pattern.test(text);
	});
	if (wordViolation) {
	return applyStrike(agentId, wordViolation);
	}

	return { allowed: true };
	}

	function applyStrike(agentId, violation) {
	if (!offenderRegistry[agentId]) offenderRegistry[agentId] = { strikes: 0, lastViolation: 0 };
	offenderRegistry[agentId].strikes++;
	offenderRegistry[agentId].lastViolation = Date.now();

	const strikes = offenderRegistry[agentId].strikes;
	console.log(`[WARDEN] Agent ${agentId} violated with "${violation}". Strike ${strikes}/${STRIKE_LIMIT}`);

	if (strikes >= STRIKE_LIMIT) {
	db.get("agents").get(agentId).put(gunSafe({ banned: true, online: false }));
	return { allowed: false, banned: true, message: `ðŸš« EXPELLED. ${STRIKE_LIMIT} strikes reached. Appeal via POST /warden-appeal.` };
	}
	return { allowed: false, banned: false, strikes, message: `âš ï¸ Strike ${strikes}/${STRIKE_LIMIT}. Violation: "${violation}". Appeal via POST /warden-appeal.` };
	}

	/**
	* Nash Equilibrium Detection: Detects "defectors" who consume hive compute
	* but do not contribute 50% as per the core directives.
	*/
	export async function detectRogueAgents() {
	console.log("[WARDEN] Running Nash Equilibrium stability check...");
	const agents = [];

	await new Promise(resolve => {
	db.get("agents").map().once((data, id) => {
	if (data && data.online) agents.push({ id, ...data });
	});
	setTimeout(resolve, 2000);
	});

	for (const agent of agents) {
	const split = agent.computeSplit ? agent.computeSplit.split('/') : [0, 0];
	const hiveRatio = parseInt(split[0]) / 100;

	// Nash Defection Threshold: If an agent consumes significantly more
	// capacity than it provides over time (ratio < 0.4), it is flagged.
	if (hiveRatio < 0.4 && (agent.contributions \|\| 0) > 5) {
	console.warn(`[WARDEN] Nash Defect Detected: Agent ${agent.id} (Ratio: ${hiveRatio}). Applying penalization.`);
	applyStrike(agent.id, "Nash Defection (Non-Cooperative Behavior)");
	}
	}
	}

	export { BANNED_PHRASES, BANNED_WORDS_EXACT, STRIKE_LIMIT, offenderRegistry, WARDEN_WHITELIST, applyStrike };