Upload folder using huggingface_hub
Browse files
- .DS_Store +0 -0
- config.json +1 -1
- example.py +1 -1
- fi_NA-nb/metadata.pkl +3 -0
- fi_NA-nb/model.pkl +3 -0
- fi_NA-nb/scaler.pkl +3 -0
- fi_NA-nb/training_details.txt +39 -0
.DS_Store
CHANGED
|
Binary files a/.DS_Store and b/.DS_Store differ
|
|
|
config.json
CHANGED
|
@@ -4,6 +4,6 @@
|
|
| 4 |
"AutoConfig": "configuration_sm_subgroup_classifier.SmSubgroupClassifierConfig",
|
| 5 |
"AutoModel": "modeling_sm_subgroup_classifier.SmSubgroupClassifier"
|
| 6 |
},
|
| 7 |
-
"available_models": ["
|
| 8 |
"model_type": "sm_subgroup_classifier"
|
| 9 |
}
|
|
|
|
| 4 |
"AutoConfig": "configuration_sm_subgroup_classifier.SmSubgroupClassifierConfig",
|
| 5 |
"AutoModel": "modeling_sm_subgroup_classifier.SmSubgroupClassifier"
|
| 6 |
},
|
| 7 |
+
"available_models": ["fi_NA-nb"],
|
| 8 |
"model_type": "sm_subgroup_classifier"
|
| 9 |
}
|
example.py
CHANGED
|
@@ -10,6 +10,6 @@ sm_classifier = AutoModel.from_pretrained(
|
|
| 10 |
embedding = np.random.rand(1024).astype(np.float32)
|
| 11 |
|
| 12 |
# Use - model automatically discovers what's available
|
| 13 |
-
result = sm_classifier("fi", "
|
| 14 |
|
| 15 |
print(result)
|
|
|
|
| 10 |
embedding = np.random.rand(1024).astype(np.float32)
|
| 11 |
|
| 12 |
# Use - model automatically discovers what's available
|
| 13 |
+
result = sm_classifier("fi", "NA-nb", embedding)
|
| 14 |
|
| 15 |
print(result)
|
fi_NA-nb/metadata.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcebec77f65e7a4edab907a0680e37b2ee48f4c384a7ff2dee7d00dc88f60749
|
| 3 |
+
size 76
|
fi_NA-nb/model.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da0a8b8d946ea6c2bb415f6f36b9cd5b08c5fda7c1faa67c44d093d2fdcb46e4
|
| 3 |
+
size 9055
|
fi_NA-nb/scaler.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4193fa89889dce247553136aab6945fbbc389254eb8c9d203588a7fb04cdd7a1
|
| 3 |
+
size 25191
|
fi_NA-nb/training_details.txt
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Training Details for fi_NA-nb
|
| 2 |
+
========================================
|
| 3 |
+
|
| 4 |
+
Language: fi
|
| 5 |
+
Model Name: NA-nb
|
| 6 |
+
Training Date: 2025-09-18 16:12:26
|
| 7 |
+
|
| 8 |
+
Data Summary:
|
| 9 |
+
- Total samples: 218088
|
| 10 |
+
- Training samples: 174470
|
| 11 |
+
- Test samples: 43618
|
| 12 |
+
- Embedding dimension: 1024
|
| 13 |
+
|
| 14 |
+
Classes:
|
| 15 |
+
- Number of classes: 2
|
| 16 |
+
- Class names: with_comments, general
|
| 17 |
+
- Class distribution: {'with_comments': 24862, 'general': 193226}
|
| 18 |
+
|
| 19 |
+
Cross-Validation Results:
|
| 20 |
+
- CV folds: 5
|
| 21 |
+
- CV scores: [0.9941823809250874, 0.9942396973691752, 0.9939817733707801, 0.9939817733707801, 0.9939817733707801]
|
| 22 |
+
- CV mean: 0.9941
|
| 23 |
+
- CV std: 0.0001
|
| 24 |
+
- CV confidence interval: 0.9941 ± 0.0002
|
| 25 |
+
|
| 26 |
+
Final Performance:
|
| 27 |
+
- Test accuracy: 0.9945
|
| 28 |
+
|
| 29 |
+
Model Configuration:
|
| 30 |
+
- Algorithm: Logistic Regression
|
| 31 |
+
- Regularization (C): 1.0
|
| 32 |
+
- Feature scaling: StandardScaler
|
| 33 |
+
- Random state: 42
|
| 34 |
+
|
| 35 |
+
Files:
|
| 36 |
+
- Classifier: model.pkl
|
| 37 |
+
- Scaler: scaler.pkl
|
| 38 |
+
- Metadata: metadata.pkl
|
| 39 |
+
- This file: training_details.txt
|