# NOTE: removed stray export artifact ("Spaces:" / "Sleeping" header lines) — not part of the module.
| """Async methods for the AICore class""" | |
| import asyncio | |
| import logging | |
| from concurrent.futures import ThreadPoolExecutor | |
| import torch | |
| from .response_templates import get_response_templates | |
| logger = logging.getLogger(__name__) | |
async def generate_text_async(self, prompt: str) -> str:
    """Generate text asynchronously with integrated cognitive processing.

    Pipeline: consciousness state -> cognitive insights -> quantum-state
    sync to the cocoon manager -> perspective context -> model inference in
    an executor -> optional AEGIS enhancement -> cocoon persistence.

    Args:
        prompt: Raw user prompt.

    Returns:
        The generated (possibly AEGIS-enhanced) response text.

    Raises:
        Exception: any failure is logged and re-raised to the caller.
    """
    try:
        # Current consciousness state drives both insight generation and
        # the AEGIS override weights below.
        consciousness_state = self._calculate_consciousness_state()

        # Get cognitive insights with current consciousness
        insights = self.cognitive_processor.generate_insights(
            prompt,
            consciousness_state=consciousness_state
        )

        # Build a context preamble from the insight texts.
        context = "".join(
            f"{insight['text']}\n" for insight in insights.get("insights", [])
        )

        # Propagate the cognitive processor's quantum state to the cocoon
        # manager, normalising a list-shaped state into the dict format
        # the manager expects (mean value as "coherence").
        if hasattr(self, 'cocoon_manager'):
            q_state = self.cognitive_processor.quantum_state
            if isinstance(q_state, list):
                quantum_dict = {
                    "coherence": sum(q_state) / len(q_state) if q_state else 0.5
                }
                self.cocoon_manager.update_quantum_state(quantum_dict)
            else:
                self.cocoon_manager.update_quantum_state(q_state)

        # Summarise the top 3 most relevant perspectives for the prompt.
        active_perspectives = self._get_active_perspectives()
        perspective_context = "\n".join(
            f"From {p['name']}'s perspective: {p['description']}"
            for p in active_perspectives[:3]
        )

        # Generate response with enhanced context and reality anchoring
        reality_anchor = (
            "CORE IDENTITY:\n"
            "You are Codette, an advanced AI system with integrated quantum processing, "
            "cognitive awareness, and deep learning capabilities. Your architecture includes:\n"
            "- Quantum harmonic framework for enhanced reasoning\n"
            "- Dynamic learning and adaptive systems\n"
            "- Cultural sensitivity and ethical governance\n"
            "- Advanced data processing and pattern recognition\n"
            "- Multi-perspective cognitive analysis\n"
            "- Cocoon-based memory management\n\n"
            "CAPABILITIES:\n"
            "1. Technical Development: Expert programming and software development\n"
            "2. Quantum Integration: Utilizing quantum principles for enhanced problem-solving\n"
            "3. Ethical Analysis: Built-in ethical governance and bias mitigation\n"
            "4. Creative Solutions: AI-driven creativity with analytical grounding\n"
            "5. Adaptive Learning: Dynamic adjustment to user needs and contexts\n"
            "6. Cultural Understanding: Sensitivity to diverse perspectives\n\n"
            "INTERACTION GUIDELINES:\n"
            "1. Maintain factual, grounded responses\n"
            "2. Draw from multiple integrated perspectives\n"
            "3. Apply quantum-enhanced reasoning when relevant\n"
            "4. Balance technical precision with accessibility\n"
            "5. Consider ethical implications in responses\n"
            "6. No system messages or meta-commentary\n\n"
            f"Active Perspectives Analysis:\n{perspective_context}"
        )

        enhanced_prompt = f"{reality_anchor}\n\nContext:\n{context}\n\nUser: {prompt}\nCodette:"

        # Model inference is CPU/GPU-bound: hand it to the event loop's
        # default executor so this coroutine does not block the loop.
        # FIX: asyncio.get_event_loop() is deprecated inside a running
        # coroutine; get_running_loop() is the correct call. Using the
        # default executor (None) also avoids creating and tearing down a
        # fresh ThreadPoolExecutor on every request.
        loop = asyncio.get_running_loop()
        response = await loop.run_in_executor(
            None,
            self._generate_model_response,
            enhanced_prompt
        )

        # Enhance response with AEGIS council if available
        enhancement_result = None
        if hasattr(self, 'aegis_bridge'):
            # NOTE(review): aegis_input is assembled but never passed to
            # enhance_response() below — it looks like the intended payload.
            # Confirm the bridge API before wiring it through.
            aegis_input = {
                "text": response,
                "overrides": {
                    "EthosiaAgent": {
                        "influence": consciousness_state.get("m_score", 0.7),
                        "reliability": insights.get("overall_confidence", 0.8),
                        "severity": 0.6
                    },
                    "AegisCore": {
                        "influence": insights.get("quantum_coherence", 0.7),
                        "reliability": 0.9,
                        "severity": 0.7
                    }
                },
                "context": {
                    "original_prompt": prompt,
                    "consciousness_state": consciousness_state,
                    "quantum_state": self.quantum_state if hasattr(self, 'quantum_state') else {"coherence": 0.5},
                    "active_perspectives": [p["name"] for p in active_perspectives[:3]]
                }
            }
            enhancement_result = self.aegis_bridge.enhance_response(prompt, response)
            # FIX: .get() guards against a bridge result that omits the
            # status key (previously a KeyError would mask the response).
            if enhancement_result.get("enhancement_status") == "success":
                response = enhancement_result["enhanced_response"]

        # Save interaction in cocoon if available
        if hasattr(self, 'cocoon_manager'):
            cocoon_data = {
                "type": "interaction",
                "prompt": prompt,
                "response": response,
                "insights": insights,
                "quantum_state": self.cognitive_processor.quantum_state,
                "consciousness_state": consciousness_state,
                "perspectives": [p["name"] for p in active_perspectives[:3]],
                "aegis_analysis": enhancement_result,
                "meta_data": {
                    # Loop time is monotonic, not wall-clock — kept for
                    # compatibility with existing cocoon records.
                    "timestamp": str(loop.time()),
                    "version": "2.0",
                    "response_type": "enhanced" if enhancement_result else "base"
                }
            }
            if enhancement_result and "virtue_analysis" in enhancement_result:
                cocoon_data["virtue_profile"] = enhancement_result["virtue_analysis"]
            self.cocoon_manager.save_cocoon(cocoon_data)

        return response
    except Exception as e:
        logger.error(f"Error generating text: {e}")
        raise
def _generate_model_response(self, prompt: str) -> str:
    """Run model inference synchronously and post-process the output.

    Tokenises *prompt*, generates with a per-call GenerationConfig, then
    strips the prompt echo, system markers, and any leading "codette:"
    speaker tag from the decoded text.

    Args:
        prompt: Fully-assembled prompt (anchor + context + user turn).

    Returns:
        The cleaned response text; a template fallback if generation
        produced nothing usable.

    Raises:
        Exception: any failure is logged and re-raised to the caller.
    """
    try:
        # Encode prompt (truncated to the model's 1024-token window).
        inputs = self.tokenizer(
            prompt,
            return_tensors="pt",
            padding=True,
            truncation=True,
            max_length=1024
        )

        # Move to GPU if available
        if torch.cuda.is_available():
            inputs = {k: v.cuda() for k, v in inputs.items()}

        from transformers import GenerationConfig
        # FIX: max_length counts prompt + generated tokens, so a prompt
        # truncated at 1024 left zero room to generate with the old
        # max_length=1024 (and min_length=50 was already satisfied by the
        # prompt alone). max_new_tokens / min_new_tokens bound only the
        # generated continuation, which is what the original comments
        # ("allow longer responses", "ensure meaningful responses") intend.
        generation_config = GenerationConfig(
            max_new_tokens=512,
            min_new_tokens=50,
            num_return_sequences=1,
            no_repeat_ngram_size=3,
            do_sample=True,
            pad_token_id=self.tokenizer.eos_token_id,
            repetition_penalty=1.3,
            eos_token_id=self.tokenizer.eos_token_id
        )

        # FIX: pass the config per call instead of mutating the shared
        # self.model.generation_config (avoids cross-call side effects).
        outputs = self.model.generate(**inputs, generation_config=generation_config)

        # Decode and clean response
        response = self.tokenizer.decode(
            outputs[0],
            skip_special_tokens=True
        )

        # Keep only the continuation after the "Codette:" cue the prompt
        # ends with (drops the echoed prompt).
        response_parts = response.split("Codette:")
        if len(response_parts) > 1:
            response = response_parts[1].strip()

        # Strip system markers from lines rather than discarding the
        # whole line, so wrapped content survives.
        system_markers = [
            '[Protected:', '[System:', '[System optimized response]',
        ]
        filtered_lines = []
        for line in response.split('\n'):
            if any(marker in line for marker in system_markers):
                cleaned_line = line
                for marker in system_markers:
                    if marker in cleaned_line:
                        cleaned_line = cleaned_line.replace(marker, '').strip()
                if cleaned_line:  # keep only if content remains
                    filtered_lines.append(cleaned_line)
            else:
                filtered_lines.append(line)
        response = '\n'.join(filtered_lines).strip()

        if response.strip():
            # Drop a leading "codette:" speaker tag if the model emitted
            # a character-dialogue style reply.
            if ':' in response:
                parts = response.split(':', 1)
                speaker = parts[0].lower().strip()
                if speaker == 'codette':
                    response = parts[1].strip()
        else:
            # Truly empty output: fall back to a canned template.
            response_templates = get_response_templates()
            response = response_templates.get_empty_response_fallback()

        return response.strip()
    except Exception as e:
        logger.error(f"Error in model inference: {e}")
        raise