File size: 1,207 Bytes
8278269
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
# Multimodal AI System configuration

# Model configuration
# Each value is an "<organization>/<model-name>" identifier; presumably these
# are Hugging Face Hub model IDs resolved by the loader — confirm in the
# consuming code.
models:
  text_embedder: "sentence-transformers/all-MiniLM-L6-v2"
  sentiment_analyzer: "cardiffnlp/twitter-roberta-base-sentiment-latest"
  image_captioner: "Salesforce/blip-image-captioning-base"
  image_classifier: "google/vit-base-patch16-224"

# Processing settings
processing:
  # NOTE(review): unit (tokens vs. characters) is not stated here — confirm.
  max_text_length: 512
  # Two-element list; both dimensions are 224, so the axis order is not
  # observable from this file.
  image_size:
    - 224
    - 224
  # Presumably in Hz — confirm with the audio loader.
  audio_sample_rate: 16000
  batch_size: 8
  max_concurrent_requests: 10

# Dimensionality-reduction settings
# One sub-mapping per algorithm. The key names look like the usual UMAP /
# t-SNE / DBSCAN constructor arguments and are presumably passed through
# as-is — confirm with the consuming code.
# NOTE(review): `dbscan` is a clustering algorithm rather than a reducer; it
# is presumably grouped here because it runs on the reduced embeddings.
dimensionality_reduction:
  umap:
    n_components: 2
    n_neighbors: 15
    min_dist: 0.1
    # Same seed as `tsne.random_state` below.
    random_state: 42
  tsne:
    n_components: 2
    perplexity: 30
    random_state: 42
  dbscan:
    eps: 0.5
    min_samples: 5

# User-interface settings
interface:
  title: 'Sistema de IA Multimodal Avanzado'
  theme: 'soft'
  # Stored as a string with a unit suffix, not as a number of bytes.
  max_file_size: '10MB'
  # Each entry includes the leading dot.
  allowed_extensions:
    - '.jpg'
    - '.png'
    - '.wav'
    - '.mp3'
    - '.txt'

# Logging settings
logging:
  level: 'INFO'
  # %-style placeholders; the field names match the LogRecord attributes of
  # Python's logging module (presumably the consumer — confirm).
  format: '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
  # Relative path; where it resolves depends on the consumer.
  file: 'multimodal_system.log'

# Resource settings
resources:
  gpu_memory_fraction: 0.8
  cpu_threads: 4
  # Stored as a string with a unit suffix, not as a number of bytes.
  cache_size: '1GB'