Spaces:

Trujasx
/

RobotCleanPupusas

Runtime error

File size: 24,202 Bytes

5ed0597

# backend/train_robot.py
import subprocess
import os
import gradio as gr
import json
import torch

# --- Helper Functions (reused from record_controller for consistency) ---

def run_command(command: str, description: str):
    """
    Ejecuta un comando de shell y captura su salida, manejando errores.
    """
    print(f"\n--- {description} ---")
    process_output = []
    try:
        # Use Popen to stream output in real-time
        process = subprocess.Popen(
            command,
            shell=True,
            stdout=subprocess.PIPE,
            stderr=subprocess.STDOUT, # Redirect stderr to stdout
            text=True
        )

        for line in iter(process.stdout.readline, ''):
            print(line, end='') # Print to console
            process_output.append(line)
            # You might want to yield here for Gradio's gr.Progress,
            # but for simplicity, we'll collect all output and return at the end.

        process.wait() # Wait for the process to complete

        if process.returncode == 0:
            print(f"Éxito: {description}")
            return True, "".join(process_output)
        else:
            error_message = f"Error durante '{description}': El comando devolvió el código de salida {process.returncode}"
            print(error_message)
            return False, "".join(process_output) # Return all collected output, including errors
    except Exception as e:
        error_message = f"Ocurrió un error inesperado durante '{description}': {e}"
        print(error_message)
        return False, error_message

def login_to_huggingface(token: str):
    """
    Inicia sesión en Hugging Face CLI con el token proporcionado.
    """
    if not token or token == "hf_YOUR_ACTUAL_WRITE_TOKEN_HERE":
        return False, "Error: Por favor, proporciona un token de Hugging Face válido."

    success, output = run_command(
        f"huggingface-cli login --token {token} --add-to-git-credential",
        "Iniciando sesión en Hugging Face CLI"
    )
    if success:
        return True, "¡Inicio de sesión en Hugging Face exitoso!"
    else:
        return False, output

def get_huggingface_user():
    """
    Obtiene el nombre de usuario de Hugging Face.
    """
    success, output = run_command(
        "huggingface-cli whoami | head -n 1",
        "Obteniendo nombre de usuario de Hugging Face"
    )
    if success:
        # The output might contain warnings before the actual username.
        # Try to find the username, which should be the first non-empty, non-warning line.
        lines = output.splitlines()
        for line in lines:
            if line.strip() and not (line.strip().startswith("warnings.") or "deprecated" in line.lower()):
                return True, line.strip()
        return False, "No se pudo extraer el nombre de usuario de la salida de 'whoami'."
    else:
        return False, output

# --- Core Training and Upload Logic ---

def train_policy_core(hf_user: str,
                      dataset_repo_id: str,
                      policy_type: str,
                      output_dir: str,
                      job_name: str,
                      policy_device: str,
                      wandb_enable: bool,
                      resume: bool,
                      resume_config_path: str):
    """
    Entrena una política de robot usando el script `lerobot/scripts/train.py`.
    """
    if not hf_user:
        return False, "Error: Nombre de usuario de Hugging Face no disponible. Por favor, inicia sesión primero."
    if not dataset_repo_id.startswith(f"{hf_user}/"):
        dataset_repo_id = f"{hf_user}/{dataset_repo_id.split('/')[-1]}" # Ensure correct repo_id format

    print(f"\nPreparando para entrenar la política '{policy_type}' con el dataset '{dataset_repo_id}'...")

    command = [
        "python", "-m", "lerobot.scripts.train" # Changed to -m lerobot.scripts.train
    ]

    if resume and resume_config_path:
        command.extend([
            f"--config_path={resume_config_path}",
            "--resume=true"
        ])
    else:
        command.extend([
            f"--dataset.repo_id={dataset_repo_id}",
            f"--policy.type={policy_type}",
            f"--output_dir={output_dir}",
            f"--job_name={job_name}",
            f"--policy.device={policy_device}"
        ])
        if wandb_enable:
            command.append("--wandb.enable=true")

    full_command = " ".join(command)

    success, output = run_command(full_command, "Entrenamiento de la Política")
    if success:
        final_message = f"¡Entrenamiento de la política completado exitosamente!\n"
        final_message += f"Los checkpoints se guardaron en: {output_dir}/checkpoints\n"
        if wandb_enable:
            final_message += "Revisa Weights & Biases para los gráficos de entrenamiento.\n"
        return True, final_message + "\n" + output # Add full output for visibility
    else:
        return False, f"Error durante el entrenamiento: {output}"

def upload_policy_core(hf_user: str, policy_repo_name: str, checkpoint_path: str, is_intermediate: bool = False):
    """
    Sube un checkpoint de política a Hugging Face Hub.
    """
    if not hf_user:
        return False, "Error: Nombre de usuario de Hugging Face no disponible. Por favor, inicia sesión primero."
    if not policy_repo_name:
        return False, "Error: El nombre del repositorio de la política no puede estar vacío."
    if not checkpoint_path:
        return False, "Error: La ruta al checkpoint no puede estar vacía."
    if not os.path.exists(checkpoint_path):
        return False, f"Error: La ruta del checkpoint '{checkpoint_path}' no existe."

    full_repo_id = f"{hf_user}/{policy_repo_name}"
    
    # Hugging Face CLI upload expects the local path to be the second argument
    command = [
        "huggingface-cli", "upload",
        full_repo_id,
        checkpoint_path,
        "--repo-type=model" # Specify repo type as model for policies
    ]
    
    if is_intermediate:
        # For intermediate, we might want to append CKPT to the repo name or use a specific folder within the repo
        # The provided doc uses policy_nameCKPT. Let's adapt to that if the user provides just base name
        # However, huggingface-cli upload expects a repo_id, which is HF_USER/REPO_NAME
        # The common practice is to upload to the same repo but into a different subfolder.
        # For simplicity, we'll stick to uploading the specified path to the given repo_id.
        pass # The logic for is_intermediate might depend on how the user names their repos/checkpoints

    full_command = " ".join(command)

    success, output = run_command(full_command, f"Subiendo política a {full_repo_id}")
    if success:
        return True, f"¡Política subida exitosamente a https://huggingface.co/{full_repo_id}!"
    else:
        return False, f"Error al subir política: {output}"

def evaluate_policy_core(hf_user: str,
                         robot_type: str,
                         robot_port: str,
                         robot_cameras: str, # Raw string for cameras
                         robot_id: str,
                         display_data: bool,
                         dataset_repo_id_eval: str,
                         single_task: str,
                         policy_path: str,
                         teleop_enable: bool = False, # Optional teleop for evaluation
                         teleop_type: str = "",
                         teleop_port: str = "",
                         teleop_id: str = ""):
    """
    Evalúa una política utilizando el script `lerobot.record` modificado.
    """
    if not hf_user:
        return False, "Error: Nombre de usuario de Hugging Face no disponible. Por favor, inicia sesión primero."
    if not policy_path:
        return False, "Error: La ruta a la política para evaluar no puede estar vacía."

    # Ensure eval dataset repo ID starts with user
    if not dataset_repo_id_eval.startswith(f"{hf_user}/"):
        dataset_repo_id_eval = f"{hf_user}/{dataset_repo_id_eval.split('/')[-1]}"


    print(f"\nPreparando para evaluar la política '{policy_path}'...")

    command = [
        "python", "-m", "lerobot.record",
        f"--robot.type={robot_type}",
        f"--robot.port={robot_port}",
        f"--robot.cameras=\"{robot_cameras}\"", # Use the raw string provided by user
        f"--robot.id={robot_id}",
        f"--display_data={str(display_data).lower()}",
        f"--dataset.repo_id={dataset_repo_id_eval}",
        f"--dataset.single_task=\"{single_task}\"",
        f"--policy.path={policy_path}"
    ]

    if teleop_enable:
        command.extend([
            f"--teleop.type={teleop_type}",
            f"--teleop.port={teleop_port}",
            f"--teleop.id={teleop_id}"
        ])

    full_command = " ".join(command)

    success, output = run_command(full_command, "Evaluación de la Política")
    if success:
        final_message = f"¡Evaluación de la política completada exitosamente!\n"
        final_message += f"Los datos de evaluación se guardaron en: ~/.cache/huggingface/lerobot/{dataset_repo_id_eval}\n"
        return True, final_message + "\n" + output
    else:
        return False, f"Error durante la evaluación: {output}"

# --- Gradio Interface Logic ---

# Variable global para almacenar el usuario de Hugging Face
current_hf_user = None

def gradio_login(hf_token_input: str):
    """Interfaz Gradio para iniciar sesión en Hugging Face."""
    global current_hf_user
    success, message = login_to_huggingface(hf_token_input)
    if success:
        gr.Info(message)
        success_user, user_name = get_huggingface_user()
        if success_user:
            current_hf_user = user_name
            return gr.update(value=user_name, interactive=False), gr.update(visible=True, value=message)
        else:
            return gr.update(value="", interactive=True), gr.update(visible=True, value=user_name)
    else:
        current_hf_user = None
        return gr.update(value="", interactive=True), gr.update(visible=True, value=message)

def gradio_train(dataset_repo_id_input: str,
                 policy_type_input: str,
                 output_dir_input: str,
                 job_name_input: str,
                 policy_device_input: str,
                 wandb_enable_input: bool,
                 resume_input: bool,
                 resume_config_path_input: str):
    """Interfaz Gradio para iniciar el entrenamiento."""
    global current_hf_user
    if not current_hf_user:
        return gr.update(visible=True, value="Error: No se ha iniciado sesión en Hugging Face o no se pudo obtener el usuario. Por favor, inicia sesión primero.")

    gr.Info("Iniciando entrenamiento del modelo. Esto puede tardar mucho tiempo...")
    success, message = train_policy_core(
        hf_user=current_hf_user,
        dataset_repo_id=dataset_repo_id_input,
        policy_type=policy_type_input,
        output_dir=output_dir_input,
        job_name=job_name_input,
        policy_device=policy_device_input,
        wandb_enable=wandb_enable_input,
        resume=resume_input,
        resume_config_path=resume_config_path_input
    )
    if success:
        gr.Info("Entrenamiento completado. Revisa la salida para los detalles.")
    else:
        gr.Info("Entrenamiento fallido. Revisa la salida para los errores.")
    return gr.update(visible=True, value=message)

def gradio_upload(policy_repo_name_input: str, checkpoint_path_input: str):
    """Interfaz Gradio para subir un checkpoint."""
    global current_hf_user
    if not current_hf_user:
        return gr.update(visible=True, value="Error: No se ha iniciado sesión en Hugging Face. Por favor, inicia sesión primero.")

    gr.Info(f"Subiendo checkpoint '{checkpoint_path_input}' a '{policy_repo_name_input}'...")
    success, message = upload_policy_core(
        hf_user=current_hf_user,
        policy_repo_name=policy_repo_name_input,
        checkpoint_path=checkpoint_path_input
    )
    if success:
        gr.Info("Subida completada.")
    else:
        gr.Info("Subida fallida. Revisa la salida.")
    return gr.update(visible=True, value=message)

def gradio_evaluate(robot_type_input: str,
                    robot_port_input: str,
                    robot_cameras_input: str,
                    robot_id_input: str,
                    display_data_input: bool,
                    dataset_repo_id_eval_input: str,
                    single_task_eval_input: str,
                    policy_path_input: str,
                    teleop_enable_input: bool,
                    teleop_type_input: str,
                    teleop_port_input: str,
                    teleop_id_input: str):
    """Interfaz Gradio para evaluar una política."""
    global current_hf_user
    if not current_hf_user:
        return gr.update(visible=True, value="Error: No se ha iniciado sesión en Hugging Face. Por favor, inicia sesión primero.")

    gr.Info("Iniciando evaluación de la política...")
    success, message = evaluate_policy_core(
        hf_user=current_hf_user,
        robot_type=robot_type_input,
        robot_port=robot_port_input,
        robot_cameras=robot_cameras_input,
        robot_id=robot_id_input,
        display_data=display_data_input,
        dataset_repo_id_eval=dataset_repo_id_eval_input,
        single_task=single_task_eval_input,
        policy_path=policy_path_input,
        teleop_enable=teleop_enable_input,
        teleop_type=teleop_type_input,
        teleop_port=teleop_port_input,
        teleop_id=teleop_id_input
    )
    if success:
        gr.Info("Evaluación completada.")
    else:
        gr.Info("Evaluación fallida. Revisa la salida.")
    return gr.update(visible=True, value=message)

# --- Gradio Interface Definition ---

with gr.Blocks(title="Controlador de Entrenamiento y Evaluación LeRobot") as demo:
    gr.Markdown("# <center>Controlador de Entrenamiento y Evaluación de Políticas LeRobot</center>")
    gr.Markdown("Esta interfaz te permite entrenar, subir y evaluar políticas de robot con LeRobot.")

    with gr.Tab("1. Configuración de Hugging Face"):
        gr.Markdown("## Configuración de Hugging Face")
        gr.Markdown(
            "Introduce tu **token de Hugging Face con permisos de escritura**. "
            "Puedes generarlo en [huggingface.co/settings/tokens](https://huggingface.co/settings/tokens)."
        )
        hf_token_input = gr.Textbox(
            label="Token de Hugging Face",
            type="password",
            placeholder="hf_YOUR_ACTUAL_WRITE_TOKEN_HERE",
            info="El token debe tener permisos de escritura (write)."
        )
        login_btn = gr.Button("Iniciar Sesión / Verificar Token")
        hf_user_output = gr.Textbox(label="Usuario de Hugging Face Actual", interactive=False, placeholder="No autenticado", show_copy_button=True)
        login_status_output = gr.Textbox(label="Estado de Autenticación", interactive=False, visible=False, lines=3)
        
        login_btn.click(
            fn=gradio_login,
            inputs=hf_token_input,
            outputs=[hf_user_output, login_status_output]
        )

    with gr.Tab("2. Entrenamiento de la Política"):
        gr.Markdown("## Entrenar una Política")
        gr.Markdown(
            "Configura los parámetros para entrenar tu política. Asegúrate de tener el dataset listo en Hugging Face Hub."
        )
        with gr.Row():
            dataset_repo_id_input = gr.Textbox(
                label="ID del Repositorio del Dataset (ej. YOUR_USER/so101_test)",
                value="YOUR_USER/so101_test", # Placeholder, will be updated by HF user
                placeholder="Dataset para entrenar",
                info="Asegúrate de que este dataset ya haya sido subido con el script de grabación."
            )
            policy_type_input = gr.Dropdown(
                label="Tipo de Política",
                choices=["act", "diffusion", "rlds"], # Add more types as needed from LeRobot
                value="act",
                info="Tipo de arquitectura de política a entrenar (e.g., ACT)."
            )
        with gr.Row():
            output_dir_input = gr.Textbox(
                label="Directorio de Salida para Checkpoints",
                value="outputs/train/act_so101_test",
                placeholder="Directorio donde se guardarán los resultados del entrenamiento."
            )
            job_name_input = gr.Textbox(
                label="Nombre del Trabajo (Job Name)",
                value="act_so101_test",
                placeholder="Nombre para identificar tu sesión de entrenamiento."
            )
        with gr.Row():
            policy_device_input = gr.Dropdown(
                label="Dispositivo de Entrenamiento",
                choices=["cuda", "mps", "cpu"],
                value="cuda" if torch.cuda.is_available() else ("mps" if torch.backends.mps.is_available() else "cpu"), # Auto-detect simple device
                info="Dispositivo a usar para el entrenamiento (GPU Nvidia: cuda, Apple Silicon: mps, CPU: cpu)."
            )
            wandb_enable_input = gr.Checkbox(
                label="Habilitar Weights & Biases",
                value=True,
                info="Habilita el seguimiento de métricas con Weights & Biases (asegúrate de haber ejecutado 'wandb login')."
            )
        
        gr.Markdown("### Opciones de Reanudación")
        resume_input = gr.Checkbox(
            label="Reanudar Entrenamiento Existente",
            value=False,
            info="Marca esta casilla para continuar un entrenamiento desde un checkpoint."
        )
        resume_config_path_input = gr.Textbox(
            label="Ruta al train_config.json para Reanudar (ej. outputs/train/act_so101_test/checkpoints/last/pretrained_model/train_config.json)",
            placeholder="Ruta al archivo train_config.json del checkpoint a reanudar.",
            visible=False # Hidden by default, shown when resume is checked
        )
        
        resume_input.change(
            lambda x: gr.update(visible=x),
            inputs=resume_input,
            outputs=resume_config_path_input
        )

        train_btn = gr.Button("🚀 Iniciar Entrenamiento 🚀", variant="primary")
        train_status_output = gr.Textbox(
            label="Log de Entrenamiento",
            interactive=False,
            visible=False,
            lines=20,
            autoscroll=True
        )

        train_btn.click(
            fn=gradio_train,
            inputs=[
                dataset_repo_id_input,
                policy_type_input,
                output_dir_input,
                job_name_input,
                policy_device_input,
                wandb_enable_input,
                resume_input,
                resume_config_path_input
            ],
            outputs=train_status_output
        )

    with gr.Tab("3. Subir Checkpoint de Política"):
        gr.Markdown("## Subir Checkpoint de Política al Hub")
        gr.Markdown(
            "Sube tus modelos entrenados a Hugging Face Hub para compartirlos o usarlos en evaluación."
        )
        policy_repo_name_input = gr.Textbox(
            label="Nombre del Repositorio de la Política (ej. act_so101_test)",
            value="act_so101_test",
            placeholder="Nombre del repositorio en Hugging Face Hub para tu política."
        )
        checkpoint_path_input = gr.Textbox(
            label="Ruta Local al Directorio del Checkpoint (ej. outputs/train/act_so101_test/checkpoints/last/pretrained_model)",
            placeholder="Ruta completa al directorio 'pretrained_model' del checkpoint."
        )
        upload_btn = gr.Button("⬆️ Subir Política ⬆️", variant="secondary")
        upload_status_output = gr.Textbox(
            label="Log de Subida",
            interactive=False,
            visible=False,
            lines=5
        )

        upload_btn.click(
            fn=gradio_upload,
            inputs=[policy_repo_name_input, checkpoint_path_input],
            outputs=upload_status_output
        )

    with gr.Tab("4. Evaluar Política"):
        gr.Markdown("## Evaluar una Política Entrenada")
        gr.Markdown(
            "Usa esta sección para probar tu política entrenada con el robot real. "
            "La teleoperación es opcional durante la evaluación."
        )
        with gr.Row():
            robot_type_eval_input = gr.Textbox(label="Tipo de Robot (e.g., so100_follower)", value="so100_follower")
            robot_port_eval_input = gr.Textbox(label="Puerto del Robot (e.g., /dev/ttyACM1)", value="/dev/ttyACM1")
        
        robot_cameras_eval_input = gr.Textbox(
            label="Configuración de Cámaras (JSON string)",
            value='{ up: {type: opencv, index_or_path: /dev/video10, width: 640, height: 480, fps: 30}}',
            info="Define tus cámaras como un string JSON. Asegúrate de escapar las comillas internas si es necesario."
        )
        robot_id_eval_input = gr.Textbox(label="ID del Robot", value="my_awesome_follower_arm")
        display_data_eval_input = gr.Checkbox(label="Mostrar Datos (Display Data)", value=False)
        dataset_repo_id_eval_input = gr.Textbox(
            label="ID del Repositorio del Dataset de Evaluación (ej. YOUR_USER/eval_so100)",
            value="YOUR_USER/eval_so100",
            info="El nombre del dataset para guardar los resultados de la evaluación (suele empezar con 'eval_')."
        )
        single_task_eval_input = gr.Textbox(
            label="Descripción de la Tarea (Single Task)",
            value="Put lego brick into the transparent box"
        )
        policy_path_input = gr.Textbox(
            label="Ruta de la Política a Evaluar (local o Hugging Face Hub ID)",
            placeholder="ej. outputs/train/eval_act_so101_test/checkpoints/last/pretrained_model O YOUR_USER/my_policy",
            info="Puede ser una ruta local al checkpoint o el ID de un repositorio de modelo en Hugging Face Hub."
        )

        gr.Markdown("### Teleoperación (Opcional durante la Evaluación)")
        teleop_enable_eval_input = gr.Checkbox(label="Habilitar Teleoperación Durante Evaluación", value=False)
        with gr.Row(visible=False) as teleop_options_row: # Hidden by default
            teleop_type_eval_input = gr.Textbox(label="Tipo de Teleop (e.g., so100_leader)", value="so100_leader")
            teleop_port_eval_input = gr.Textbox(label="Puerto de Teleop (e.g., /dev/ttyACM0)", value="/dev/ttyACM0")
            teleop_id_eval_input = gr.Textbox(label="ID de Teleop", value="my_awesome_leader_arm")
        
        teleop_enable_eval_input.change(
            lambda x: gr.update(visible=x),
            inputs=teleop_enable_eval_input,
            outputs=teleop_options_row
        )

        evaluate_btn = gr.Button("📊 Iniciar Evaluación 📊", variant="primary")
        evaluate_status_output = gr.Textbox(
            label="Log de Evaluación",
            interactive=False,
            visible=False,
            lines=15,
            autoscroll=True
        )

        evaluate_btn.click(
            fn=gradio_evaluate,
            inputs=[
                robot_type_eval_input,
                robot_port_eval_input,
                robot_cameras_eval_input,
                robot_id_eval_input,
                display_data_eval_input,
                dataset_repo_id_eval_input,
                single_task_eval_input,
                policy_path_input,
                teleop_enable_eval_input,
                teleop_type_eval_input,
                teleop_port_eval_input,
                teleop_id_eval_input
            ],
            outputs=evaluate_status_output
        )

    gr.Markdown("---")
    gr.Markdown("Hecho con ❤️ para RobotCleanPupusas503")

# Auto-detect CUDA/MPS availability for default device selection (requires torch)
try:
    import torch
except ImportError:
    print("Advertencia: PyTorch no está instalado. No se podrá auto-detectar 'cuda' o 'mps'.")
    torch = None

if __name__ == "__main__":
    demo.launch(share=False)