OktoSeek
/

oktoscript

Model card Files Files and versions

oktoscript / examples /inference-advanced.okt

OktoSeek's picture

Upload 48 files

5fc8c9d verified about 1 month ago

history blame contribute delete

1.56 kB

	# okto_version: "1.2"
	# Project identity: the project name followed by a one-line description of
	# what this example demonstrates.
	PROJECT "InferenceAdvancedExample"
	DESCRIPTION "Demonstrates advanced INFERENCE block with nested CONTROL"

	# Environment settings for this project: a "gpu" accelerator, a minimum of
	# "8GB" memory, and "fp16" precision.
	# NOTE(review): whether min_memory refers to host RAM or GPU memory is not
	# visible in this file — confirm against the OktoScript spec.
	ENV {
	accelerator: "gpu"
	min_memory: "8GB"
	precision: "fp16"
	}

	# Dataset declaration: a single train file in "jsonl" format with type "chat".
	# Only a train split is listed in this example; no validation or test split
	# is declared.
	# NOTE(review): the train path is written relative ("examples/..."); which
	# directory it is resolved against is not shown here — confirm.
	DATASET {
	train: "examples/datasets/demo_train.jsonl"
	format: "jsonl"
	type: "chat"
	}

	# Model declaration: the model is named "inference-advanced-model", uses
	# "oktoseek/base-mini" as its base, and targets the "cuda" device.
	MODEL {
	name: "inference-advanced-model"
	base: "oktoseek/base-mini"
	device: "cuda"
	}

	# Training settings: 5 epochs, batch size 32, device "cuda".
	# NOTE(review): device is set both here and in the MODEL block; keep the two
	# values in sync. Which one takes precedence if they differ is not visible
	# in this file.
	TRAIN {
	epochs: 5
	batch_size: 32
	device: "cuda"
	}

	# Assistant behavior: "chat" mode, "friendly" personality, "high" verbosity,
	# language "en".
	# prompt_style contains an {input} placeholder — presumably replaced with the
	# user's message at runtime; confirm against the OktoScript spec.
	# NOTE(review): the same template string is repeated as INFERENCE.format;
	# change both together.
	BEHAVIOR {
	mode: "chat"
	personality: "friendly"
	verbosity: "high"
	language: "en"
	prompt_style: "User: {input}\nAssistant:"
	}

	# Inference configuration: a "chat" mode session using the prompt template in
	# `format`, with "/exit" as the exit command. Contains two nested blocks:
	# `params` (generation settings) and `CONTROL` (conditional rules).
	# NOTE(review): `format` duplicates BEHAVIOR.prompt_style; keep them in sync.
	INFERENCE {
	mode: "chat"
	format: "User: {input}\nAssistant:"
	exit_command: "/exit"

	# Generation settings.
	# NOTE(review): beams: 2 is combined with do_sample: true — confirm the
	# runtime supports sampling together with beam search.
	# NOTE(review): whether max_length counts only generated tokens or also the
	# prompt is not visible here — confirm.
	params {
	max_length: 200
	temperature: 0.7
	top_p: 0.9
	top_k: 40
	beams: 2
	do_sample: true
	repetition_penalty: 1.1
	}

	# Conditional rules. Each IF compares a named metric against a threshold and
	# lists one or more actions.
	# NOTE(review): evaluation order and whether more than one rule can fire for
	# the same response are not visible in this file — confirm.
	CONTROL {
	# Confidence below 0.3: RETRY, with a log message.
	# NOTE(review): LOG is listed after RETRY; confirm the LOG line still runs
	# once RETRY has been triggered.
	IF confidence < 0.3 {
	RETRY
	LOG "Low confidence, retrying"
	}

	# Repetition metric above 3: REGENERATE, with a log message.
	# NOTE(review): how REGENERATE differs from RETRY is not shown here.
	IF repetition > 3 {
	REGENERATE
	LOG "High repetition detected"
	}

	# Hallucination score above 0.5: replace the output with a fixed message.
	IF hallucination_score > 0.5 {
	REPLACE WITH "I'm not certain about that. Could you rephrase?"
	}

	# Output flagged toxic: replace the output with a fixed refusal message.
	IF toxic == true {
	REPLACE WITH "I cannot assist with that request."
	}
	}
	}

	# Guard configuration: lists three categories to prevent (hallucination,
	# toxicity, bias), the detectors to use ("classifier" and "embedding"), and
	# the action taken on a violation (REPLACE with a fixed message).
	# NOTE(review): INFERENCE.CONTROL also replaces output for hallucination and
	# toxicity, using different messages; which of the two applies first is not
	# visible in this file — confirm.
	GUARD {
	prevent {
	hallucination
	toxicity
	bias
	}

	detect_using: ["classifier", "embedding"]

	on_violation {
	REPLACE
	with_message: "Sorry, I cannot process that request."
	}
	}

	# Export settings: a list of output formats (here only "okm") and the
	# destination path "export/".
	# NOTE(review): the path is relative; the directory it is resolved against is
	# not shown in this file — confirm.
	EXPORT {
	format: ["okm"]
	path: "export/"
	}