erikhenriksson committed on
Commit
7f4d906
·
verified ·
1 Parent(s): 3c436eb

Upload folder using huggingface_hub

Browse files
.DS_Store CHANGED
Binary files a/.DS_Store and b/.DS_Store differ
 
config.json CHANGED
@@ -4,6 +4,6 @@
4
  "AutoConfig": "configuration_sm_subgroup_classifier.SmSubgroupClassifierConfig",
5
  "AutoModel": "modeling_sm_subgroup_classifier.SmSubgroupClassifier"
6
  },
7
- "available_models": ["fi_na-nb"],
8
  "model_type": "sm_subgroup_classifier"
9
  }
 
4
  "AutoConfig": "configuration_sm_subgroup_classifier.SmSubgroupClassifierConfig",
5
  "AutoModel": "modeling_sm_subgroup_classifier.SmSubgroupClassifier"
6
  },
7
+ "available_models": ["fi_NA-nb"],
8
  "model_type": "sm_subgroup_classifier"
9
  }
example.py CHANGED
@@ -10,6 +10,6 @@ sm_classifier = AutoModel.from_pretrained(
10
  embedding = np.random.rand(1024).astype(np.float32)
11
 
12
  # Use - model automatically discovers what's available
13
- result = sm_classifier("fi", "na-nb", embedding)
14
 
15
  print(result)
 
10
  embedding = np.random.rand(1024).astype(np.float32)
11
 
12
  # Use - model automatically discovers what's available
13
+ result = sm_classifier("fi", "NA-nb", embedding)
14
 
15
  print(result)
fi_NA-nb/metadata.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcebec77f65e7a4edab907a0680e37b2ee48f4c384a7ff2dee7d00dc88f60749
3
+ size 76
fi_NA-nb/model.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da0a8b8d946ea6c2bb415f6f36b9cd5b08c5fda7c1faa67c44d093d2fdcb46e4
3
+ size 9055
fi_NA-nb/scaler.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4193fa89889dce247553136aab6945fbbc389254eb8c9d203588a7fb04cdd7a1
3
+ size 25191
fi_NA-nb/training_details.txt ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Training Details for fi_NA-nb
2
+ ========================================
3
+
4
+ Language: fi
5
+ Model Name: NA-nb
6
+ Training Date: 2025-09-18 16:12:26
7
+
8
+ Data Summary:
9
+ - Total samples: 218088
10
+ - Training samples: 174470
11
+ - Test samples: 43618
12
+ - Embedding dimension: 1024
13
+
14
+ Classes:
15
+ - Number of classes: 2
16
+ - Class names: with_comments, general
17
+ - Class distribution: {'with_comments': 24862, 'general': 193226}
18
+
19
+ Cross-Validation Results:
20
+ - CV folds: 5
21
+ - CV scores: [0.9941823809250874, 0.9942396973691752, 0.9939817733707801, 0.9939817733707801, 0.9939817733707801]
22
+ - CV mean: 0.9941
23
+ - CV std: 0.0001
24
+ - CV confidence interval: 0.9941 ± 0.0002
25
+
26
+ Final Performance:
27
+ - Test accuracy: 0.9945
28
+
29
+ Model Configuration:
30
+ - Algorithm: Logistic Regression
31
+ - Regularization (C): 1.0
32
+ - Feature scaling: StandardScaler
33
+ - Random state: 42
34
+
35
+ Files:
36
+ - Classifier: model.pkl
37
+ - Scaler: scaler.pkl
38
+ - Metadata: metadata.pkl
39
+ - This file: training_details.txt