Update prediction_multilabel.py
Browse files- prediction_multilabel.py +2 -2
prediction_multilabel.py
CHANGED
|
@@ -10,8 +10,8 @@ from sentence_transformers import util
|
|
| 10 |
torch.manual_seed(1)
|
| 11 |
|
| 12 |
# Load datasets
|
| 13 |
-
df_inmemory = pd.read_csv('
|
| 14 |
-
df_paragraph = pd.read_csv('
|
| 15 |
|
| 16 |
# Load stored embeddings
|
| 17 |
with open('embeddings_prediction.pkl', "rb") as f:
|
|
|
|
| 10 |
torch.manual_seed(1)
|
| 11 |
|
| 12 |
# Load datasets
|
| 13 |
+
df_inmemory = pd.read_csv('labeled.csv') # labeled text extracted from 230 CSR GRI reports, 150 international companies, 2017-2021 period
|
| 14 |
+
df_paragraph = pd.read_csv('prediction_demo.csv') # paragraphs whose labels are to be predicted, extracted from 1.2k CSR reports, 150 German PLC companies, 2010-2021 period (645k paragraphs)
|
| 15 |
|
| 16 |
# Load stored embeddings
|
| 17 |
with open('embeddings_prediction.pkl', "rb") as f:
|