Spaces:

Roboproch
/

MLOps_project

Runtime error

Roboproch committed on Mar 19

Commit

35f287c

1 Parent(s): 93cfcb5

inserimento primi test e modifica modello

Files changed (4) hide show

MLOps_project/CD/app.py ADDED Viewed

File without changes

MLOps_project/CI/test_ci.py CHANGED Viewed

@@ -1,12 +1,12 @@
 class TestClass :
     """
-    dummy tests for the CI pipeline
     """
-    def test_1(self) :
-        x=1
-        assert x==1
-    def test_2(self) :
-        y=10
-        assert y>5

+import modello
 class TestClass :
     """
+    test sul modello per pipeline CI
     """
+    def check_trivial_output(self) :
+        assert modello.sentiment_task("neutral")[0]["label"]=="neutral" and modello.sentiment_task("awesome")[0]["label"]=="positive" and modello.sentiment_task("terrible")[0]["label"]=="negative"
+    def train_set_bigger_than_test_set(self) :
+        assert modello.df_train.shape[0]>modello.df_test.shape[0]

MLOps_project/dockerfile ADDED Viewed

+#dockerfile
+# Python version of the base image
+FROM python:3.12.1
+# copy the CD directory into /app
+COPY ./MLOps_project/CD /app
+# set the working directory
+WORKDIR /app
+# list the contents of the working directory during the build
+RUN ls
+# run the Python script
+CMD ["python", "app.py"]

MLOps_project/modello.py CHANGED Viewed

@@ -1,11 +1,25 @@
 from transformers import pipeline
 sentiment_task = pipeline("sentiment-analysis", model="cardiffnlp/twitter-roberta-base-sentiment-latest", tokenizer="cardiffnlp/twitter-roberta-base-sentiment-latest")
-# print(sentiment_task("Covid cases are increasing fast!"))
-from datasets import load_dataset
 ds = load_dataset("SetFit/tweet_sentiment_extraction")
-# load_dataset already splits the dataset
-# print the first record of the train set
-print(ds['train'][0])
-# print the first record of the test set
-print(ds['test'][0])

+# Utilities
 from transformers import pipeline
+from datasets import load_dataset
+import pandas as pd
+# Import del modello da Hugging Face
 sentiment_task = pipeline("sentiment-analysis", model="cardiffnlp/twitter-roberta-base-sentiment-latest", tokenizer="cardiffnlp/twitter-roberta-base-sentiment-latest")
+# Import di un dataset da Hugging Face
 ds = load_dataset("SetFit/tweet_sentiment_extraction")
+# Il dataset viene splittato autometicamente in train set e test set da load_dataset
+# Per comodità trasformo i dataset in dataframe di pandas
+df_train = ds['train'].to_pandas()
+df_test = ds['test'].to_pandas()
+X_train = df_train['text'].values
+y_train = df_train['label_text'].values
+X_test = df_test['text'].values
+y_test = df_test['label_text'].values
+# Estraggo il modello
+model = sentiment_task.model
+# Ri-addestro il modello sul dataset importato
+model.fit(X_train,y_train)