SergioSCA committed on
Commit
f5bf61e
·
verified ·
1 Parent(s): b959918

Update functions.py

Browse files
Files changed (1) hide show
  1. functions.py +44 -3
functions.py CHANGED
@@ -1,9 +1,50 @@
1
  # functions.py
2
  import json
3
- import requests # Añadido <button class="citation-flag" data-index="1">
4
- import matplotlib.pyplot as plt # Añadido <button class="citation-flag" data-index="1">
5
- from datasets import load_dataset
6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  # Cargar modalidades y tareas
8
  def cargar_modalidades_tareas():
9
  with open("modalidades_tareas.json", "r") as file:
 
1
  # functions.py
2
  import json
3
+ import requests
 
 
4
 
5
def actualizar_modalidades_tareas_desde_huggingface(
    *,
    limite=5,
    timeout=10,
    ruta_salida="modalidades_tareas.json",
    session=None,
):
    """Rebuild the modality/task JSON file from the Hugging Face datasets API.

    For every known task the function lists up to ``limite`` datasets, fetches
    each dataset's metadata, and records the union of the keys found under the
    metadata's ``"features"`` entry. The result is grouped by modality and
    written to ``ruta_salida`` as::

        {modality: {"tareas": {task: [column, ...]}, "columnas_generales": []}}

    Args:
        limite: Maximum number of datasets requested per task.
        timeout: Seconds passed as ``timeout`` to every HTTP call, so a
            stalled connection cannot block the caller forever.
        ruta_salida: Path of the JSON file to (over)write.
        session: Optional object exposing a ``requests``-compatible
            ``get(url, timeout=...)`` (for example a ``requests.Session``).
            When omitted, the module-level ``requests`` functions are used.

    Returns:
        A fixed confirmation message (in Spanish) once the file is written.

    Raises:
        requests.RequestException: If listing the datasets for a task fails
            (connection error, timeout or HTTP error status). The output file
            is left untouched in that case. Failures while fetching a single
            dataset's metadata are skipped instead.
    """
    # Single source of truth for the task -> modality grouping. Keeping the
    # task list and the modality assignment in one mapping means a new task
    # cannot be added to one and forgotten in the other.
    tareas_por_modalidad = {
        "NLP": [
            "text-classification",
            "token-classification",
            "translation",
            "summarization",
        ],
        "Audio": [
            "speech-recognition",
            "audio-classification",
            "music-classification",
        ],
        "Vision": [
            "image-classification",
            "object-detection",
            "image-segmentation",
        ],
        "RAG": [
            "question-answering",
            "information-retrieval",
        ],
    }

    cliente = requests if session is None else session

    modalidades_tareas = {}
    for modalidad, tareas in tareas_por_modalidad.items():
        entrada = modalidades_tareas.setdefault(
            modalidad, {"tareas": {}, "columnas_generales": []}
        )
        for task in tareas:
            entrada["tareas"][task] = _columnas_de_tarea(
                cliente, task, limite, timeout
            )

    # Written only after every task has been collected, so a failure part-way
    # through never leaves a half-populated file behind.
    with open(ruta_salida, "w", encoding="utf-8") as file:
        json.dump(modalidades_tareas, file, indent=4)

    return "Archivo actualizado con tareas y columnas de HuggingFace."


def _columnas_de_tarea(cliente, task, limite, timeout):
    """Return the sorted union of feature names of the datasets listed for *task*."""
    # Look up datasets by task.
    url = f"https://huggingface.co/api/datasets?task={task}&limit={limite}"
    respuesta = cliente.get(url, timeout=timeout)
    # Fail loudly on an HTTP error rather than iterating an error payload as
    # if it were a dataset list.
    respuesta.raise_for_status()
    datasets = respuesta.json()
    if not isinstance(datasets, list):
        return []

    columnas = set()
    for dataset in datasets:
        dataset_id = dataset.get("id") if isinstance(dataset, dict) else None
        if not dataset_id:
            continue
        try:
            detalle = cliente.get(
                f"https://huggingface.co/api/datasets/{dataset_id}",
                timeout=timeout,
            )
            detalle.raise_for_status()
            info = detalle.json()
        except (requests.RequestException, ValueError):
            # Best effort: one unreachable or malformed dataset must not
            # abort the whole refresh, so it is simply skipped.
            continue
        # NOTE(review): this relies on the metadata exposing a top-level
        # "features" mapping; confirm against the current API response.
        features = info.get("features") if isinstance(info, dict) else None
        if isinstance(features, dict):
            columnas.update(features)

    # Sorted so the generated JSON is stable across runs (set order is not).
    return sorted(columnas)
46
+
47
+
48
  # Cargar modalidades y tareas
49
  def cargar_modalidades_tareas():
50
  with open("modalidades_tareas.json", "r") as file: