Update main_process/moe_router.py
Browse files- main_process/moe_router.py +84 -54
main_process/moe_router.py
CHANGED
|
@@ -61,18 +61,30 @@ class NState(dict):
|
|
| 61 |
|
| 62 |
# ---------------- LLM utilizado para el free_narration ----------------
|
| 63 |
class SalamandraClient:
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
self.tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 67 |
self.model = AutoModelForCausalLM.from_pretrained(
|
| 68 |
model_id,
|
| 69 |
device_map="auto",
|
| 70 |
-
torch_dtype=torch.bfloat16
|
|
|
|
| 71 |
)
|
| 72 |
-
'''
|
| 73 |
|
| 74 |
-
def chat(self,
|
| 75 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 76 |
|
| 77 |
# Esto aquí sólo se utiliza para la valoración:
|
| 78 |
class GPT5Client:
|
|
@@ -1469,7 +1481,7 @@ async def generate_salamadra_result(
|
|
| 1469 |
state = tool(state, srt_final, csv_evaluacion)
|
| 1470 |
|
| 1471 |
elif isinstance(tool, Free_Narration):
|
| 1472 |
-
state = tool(state, srt_final,
|
| 1473 |
|
| 1474 |
messages_registro.append({"role": "assistant", "content": f"Ejecut茅 {tool_name} correctamente."})
|
| 1475 |
else:
|
|
@@ -1479,64 +1491,82 @@ async def generate_salamadra_result(
|
|
| 1479 |
|
| 1480 |
messages_registro = [{"role": "system", "content": "Eres un agente que puede ejecutar herramientas Python usando las herramientas disponibles."}]
|
| 1481 |
|
| 1482 |
-
|
| 1483 |
|
| 1484 |
-
|
| 1485 |
-
|
| 1486 |
-
state = add_ad(state, temp_srt_files[0].name, temp_srt_files[1].name)
|
| 1487 |
-
print("Transcripci贸n con AD guardada")
|
| 1488 |
|
| 1489 |
-
|
| 1490 |
-
|
| 1491 |
-
|
| 1492 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1493 |
|
| 1494 |
-
|
| 1495 |
-
|
| 1496 |
-
state = unir_ad_silence(state, temp_srt_files[2].name, temp_srt_files[3].name)
|
| 1497 |
-
print("Transcripci贸n con AD y Unir_AD_Silence guardada")
|
| 1498 |
|
| 1499 |
-
|
|
|
|
| 1500 |
|
| 1501 |
-
|
| 1502 |
-
|
| 1503 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1504 |
-
print("Transcripci贸n con AD y Add_Silence_AD guardada")
|
| 1505 |
|
| 1506 |
-
|
| 1507 |
-
|
| 1508 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1509 |
-
print("Transcripci贸n con AD y Unir_AD_Silences_a_ADs guardada")
|
| 1510 |
|
| 1511 |
-
|
| 1512 |
-
|
| 1513 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1514 |
-
print("Transcripci贸n con AD, Add_Silence_AD e Introduccion_OCR guardada")
|
| 1515 |
|
| 1516 |
-
|
| 1517 |
-
|
| 1518 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1519 |
-
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR e Identity_Manager guardada")
|
| 1520 |
|
| 1521 |
-
|
| 1522 |
-
|
| 1523 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1524 |
-
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR, Identity_Manager y norma UNE guardada")
|
| 1525 |
|
| 1526 |
-
|
| 1527 |
-
|
| 1528 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1529 |
-
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR, Identity_Manager y norma UNE guardada")
|
| 1530 |
|
| 1531 |
-
|
| 1532 |
-
|
| 1533 |
-
#final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1534 |
-
print("Valoraci贸n guardada")
|
| 1535 |
|
| 1536 |
-
|
| 1537 |
-
|
| 1538 |
-
state = free_narration(state, srt_final, free_narration_salamandra)
|
| 1539 |
-
print("Free Narration guardada")
|
| 1540 |
|
| 1541 |
srt_update(srt_final,srt_final)
|
| 1542 |
|
|
|
|
| 61 |
|
| 62 |
# ---------------- LLM utilizado para el free_narration ----------------
|
| 63 |
class SalamandraClient:
    """Wrapper around a Hugging Face causal LM used for tool-aware chat.

    The tokenizer and the model are loaded once in ``__init__``; ``chat``
    renders a chat-template prompt, generates a continuation and returns the
    decoded text.
    """

    def __init__(self, model_id="BSC-LT/salamandra-7b-instruct-tools"):
        """Load the tokenizer and model weights for ``model_id``.

        Args:
            model_id: Hub repository id passed to both ``from_pretrained``
                calls.
        """
        # ``token`` replaces the deprecated ``use_auth_token`` keyword, which
        # emits a FutureWarning and is dropped in newer transformers releases.
        # HF_TOKEN is expected to be defined at module level elsewhere in the
        # file (not visible here).
        self.tokenizer = AutoTokenizer.from_pretrained(model_id, token=HF_TOKEN)
        self.model = AutoModelForCausalLM.from_pretrained(
            model_id,
            device_map="auto",
            torch_dtype=torch.bfloat16,
            token=HF_TOKEN,
        )

    def chat(self, message, tools, max_new_tokens=200) -> str:
        """Generate a reply for ``message`` with ``tools`` exposed to the model.

        Args:
            message: Conversation handed unchanged to the tokenizer's
                ``apply_chat_template`` (presumably a list of role/content
                dicts -- confirm against the caller).
            tools: Tool definitions forwarded to the chat template.
            max_new_tokens: Upper bound on generated tokens; defaults to the
                previously hard-coded value of 200.

        Returns:
            The decoded first output sequence with special tokens skipped.
            The sequence returned by ``generate`` is decoded as-is, so the
            text is not trimmed to the newly generated part.
        """
        # The chat template receives today's date as an extra template variable.
        # NOTE(review): assumes ``datetime`` is the class imported via
        # ``from datetime import datetime`` -- confirm at the top of the file.
        date_string = datetime.today().strftime('%Y-%m-%d')

        prompt = self.tokenizer.apply_chat_template(
            message,
            tokenize=False,
            add_generation_prompt=True,
            date_string=date_string,
            tools=tools,
        )

        # The template output is encoded without adding special tokens again.
        inputs = self.tokenizer.encode(prompt, add_special_tokens=False, return_tensors="pt")
        outputs = self.model.generate(
            input_ids=inputs.to(self.model.device),
            max_new_tokens=max_new_tokens,
        )

        return self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
| 88 |
|
| 89 |
# Esto aquí sólo se utiliza para la valoración:
|
| 90 |
class GPT5Client:
|
|
|
|
| 1481 |
state = tool(state, srt_final, csv_evaluacion)
|
| 1482 |
|
| 1483 |
elif isinstance(tool, Free_Narration):
|
| 1484 |
+
state = tool(state, srt_final, free_narration_salamandra)
|
| 1485 |
|
| 1486 |
messages_registro.append({"role": "assistant", "content": f"Ejecut茅 {tool_name} correctamente."})
|
| 1487 |
else:
|
|
|
|
| 1491 |
|
| 1492 |
messages_registro = [{"role": "system", "content": "Eres un agente que puede ejecutar herramientas Python usando las herramientas disponibles."}]
|
| 1493 |
|
| 1494 |
+
import yaml
|
| 1495 |
|
| 1496 |
+
with open("config.yaml", "r") as file:
|
| 1497 |
+
config = yaml.safe_load(file)
|
|
|
|
|
|
|
| 1498 |
|
| 1499 |
+
stools_enabled = config.get("stools", False)
|
| 1500 |
+
|
| 1501 |
+
if stools_enabled:
|
| 1502 |
+
count = 1
|
| 1503 |
+
user_prompt = "Ejecuta la funci贸n add_ad"
|
| 1504 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, state, tools, user_prompt, messages_registro, count)
|
| 1505 |
+
|
| 1506 |
+
user_prompt = "Ejecuta la funci贸n add_silence_ad"
|
| 1507 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1508 |
+
|
| 1509 |
+
user_prompt = "Ejecuta la funci贸n unir_ad_silence"
|
| 1510 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1511 |
+
|
| 1512 |
+
count = 2
|
| 1513 |
+
user_prompt = "Ejecuta la funci贸n add_silence_ad"
|
| 1514 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1515 |
+
|
| 1516 |
+
user_prompt = "Ejecuta la funci贸n Unir_AD_Silences_a_ADs"
|
| 1517 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1518 |
+
|
| 1519 |
+
user_prompt = "Ejecuta la funci贸n Introduccion_OCR"
|
| 1520 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1521 |
+
|
| 1522 |
+
user_prompt = "Ejecuta la funci贸n Identity_Manager"
|
| 1523 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1524 |
+
|
| 1525 |
+
user_prompt = "Ejecuta la funci贸n UNE_Actor_prev"
|
| 1526 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1527 |
+
|
| 1528 |
+
user_prompt = "Ejecuta la funci贸n UNE_Actor"
|
| 1529 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1530 |
+
|
| 1531 |
+
user_prompt = "Ejecuta la funci贸n Valoracion_Final"
|
| 1532 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1533 |
+
|
| 1534 |
+
user_prompt = "Ejecuta la funci贸n Free_Narration"
|
| 1535 |
+
final_state, messages_registro = run_salamandra_agent(salamandraclient, final_state, tools, user_prompt, messages_registro, count)
|
| 1536 |
+
|
| 1537 |
+
else:
|
| 1538 |
+
state = add_ad(state, temp_srt_files[0].name, temp_srt_files[1].name)
|
| 1539 |
+
print("Transcripci贸n con AD guardada")
|
| 1540 |
|
| 1541 |
+
state = add_silence_ad(state, temp_srt_files[1].name, temp_srt_files[2].name)
|
| 1542 |
+
print("Transcripci贸n con AD y Add_Silence_AD guardada")
|
|
|
|
|
|
|
| 1543 |
|
| 1544 |
+
state = unir_ad_silence(state, temp_srt_files[2].name, temp_srt_files[3].name)
|
| 1545 |
+
print("Transcripci贸n con AD y Unir_AD_Silence guardada")
|
| 1546 |
|
| 1547 |
+
state = add_silence_ad(state, temp_srt_files[3].name, temp_srt_files[4].name)
|
| 1548 |
+
print("Transcripci贸n con AD y Add_Silence_AD guardada")
|
|
|
|
|
|
|
| 1549 |
|
| 1550 |
+
state = unir_ad_silences_a_ads(state, temp_srt_files[4].name, temp_srt_files[5].name)
|
| 1551 |
+
print("Transcripci贸n con AD y Unir_AD_Silences_a_ADs guardada")
|
|
|
|
|
|
|
| 1552 |
|
| 1553 |
+
state = introduccion_ocr(state, temp_srt_files[5].name, temp_srt_files[6].name)
|
| 1554 |
+
print("Transcripci贸n con AD, Add_Silence_AD e Introduccion_OCR guardada")
|
|
|
|
|
|
|
| 1555 |
|
| 1556 |
+
state = identity_manager(state, temp_srt_files[6].name, temp_srt_files[7].name)
|
| 1557 |
+
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR e Identity_Manager guardada")
|
|
|
|
|
|
|
| 1558 |
|
| 1559 |
+
state = une_actor_prev(state, temp_srt_files[7].name, temp_srt_files[8].name)
|
| 1560 |
+
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR, Identity_Manager y norma UNE guardada")
|
|
|
|
|
|
|
| 1561 |
|
| 1562 |
+
state = une_actor(state, temp_srt_files[8].name, srt_final)
|
| 1563 |
+
print("Transcripci贸n con AD, Add_Silence_AD, Introduccion_OCR, Identity_Manager y norma UNE guardada")
|
|
|
|
|
|
|
| 1564 |
|
| 1565 |
+
state = valoracion_final(state, srt_final, csv_evaluacion)
|
| 1566 |
+
print("Valoraci贸n guardada")
|
|
|
|
|
|
|
| 1567 |
|
| 1568 |
+
state = free_narration(state, srt_final, free_narration_salamandra)
|
| 1569 |
+
print("Free Narration guardada")
|
|
|
|
|
|
|
| 1570 |
|
| 1571 |
srt_update(srt_final,srt_final)
|
| 1572 |
|