ca-finetuned-phi-2-multiple-choice
Browse files- README.md +1 -1
- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- emissions.csv +2 -0
- runs/Feb14_23-30-17_c0c8f2aaa2e2/events.out.tfevents.1707953419.c0c8f2aaa2e2.13823.0 +3 -0
- runs/Feb14_23-33-02_c0c8f2aaa2e2/events.out.tfevents.1707953584.c0c8f2aaa2e2.14103.0 +3 -0
- tokenizer.json +1 -1
- training_args.bin +1 -1
README.md
CHANGED
|
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
|
|
| 42 |
- gradient_accumulation_steps: 10
|
| 43 |
- total_train_batch_size: 40
|
| 44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 45 |
-
- lr_scheduler_type:
|
| 46 |
- num_epochs: 10
|
| 47 |
|
| 48 |
### Training results
|
|
|
|
| 42 |
- gradient_accumulation_steps: 10
|
| 43 |
- total_train_batch_size: 40
|
| 44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 45 |
+
- lr_scheduler_type: linear
|
| 46 |
- num_epochs: 10
|
| 47 |
|
| 48 |
### Training results
|
adapter_config.json
CHANGED
|
@@ -19,9 +19,9 @@
|
|
| 19 |
"rank_pattern": {},
|
| 20 |
"revision": null,
|
| 21 |
"target_modules": [
|
| 22 |
-
"fc1",
|
| 23 |
-
"Wqkv",
|
| 24 |
"out_proj",
|
|
|
|
|
|
|
| 25 |
"fc2"
|
| 26 |
],
|
| 27 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 19 |
"rank_pattern": {},
|
| 20 |
"revision": null,
|
| 21 |
"target_modules": [
|
|
|
|
|
|
|
| 22 |
"out_proj",
|
| 23 |
+
"Wqkv",
|
| 24 |
+
"fc1",
|
| 25 |
"fc2"
|
| 26 |
],
|
| 27 |
"task_type": "CAUSAL_LM",
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 83919184
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2997cadf9d4dd11c8e8531253cca53bad09803148979889bdc9aee4b655d00
|
| 3 |
size 83919184
|
emissions.csv
CHANGED
|
@@ -10,3 +10,5 @@ timestamp,experiment_id,project_name,duration,emissions,energy_consumed,country_
|
|
| 10 |
2024-02-14T23:00:51,980e306a-c1fd-4ce5-ae14-db5d998ba9b2,codecarbon,41.59057283401489,0.003887884617418288,0.0072713536179740655,Canada,CAN,,N,,
|
| 11 |
2024-02-14T23:02:15,4f2c9857-b5bf-4b4d-a381-13e0fc49395f,codecarbon,41.660608530044556,0.003935760455724685,0.0073608938652651315,Canada,CAN,,N,,
|
| 12 |
2024-02-14T23:03:33,9c4697c8-deb9-421f-ac6e-02afeeaf15ee,codecarbon,41.67383122444153,0.0038698348528122405,0.007237595872030742,Canada,CAN,,N,,
|
|
|
|
|
|
|
|
|
| 10 |
2024-02-14T23:00:51,980e306a-c1fd-4ce5-ae14-db5d998ba9b2,codecarbon,41.59057283401489,0.003887884617418288,0.0072713536179740655,Canada,CAN,,N,,
|
| 11 |
2024-02-14T23:02:15,4f2c9857-b5bf-4b4d-a381-13e0fc49395f,codecarbon,41.660608530044556,0.003935760455724685,0.0073608938652651315,Canada,CAN,,N,,
|
| 12 |
2024-02-14T23:03:33,9c4697c8-deb9-421f-ac6e-02afeeaf15ee,codecarbon,41.67383122444153,0.0038698348528122405,0.007237595872030742,Canada,CAN,,N,,
|
| 13 |
+
2024-02-14T23:31:03,81853d8a-6372-47ef-bed5-b782cfa4de03,codecarbon,41.40422487258911,0.0038608000269561796,0.007220698402033328,Canada,CAN,,N,,
|
| 14 |
+
2024-02-14T23:46:02,eca5c0fe-8516-455b-aebe-57731462102d,codecarbon,775.5782225131989,0.0777968384134041,0.14550028566431314,Canada,CAN,,N,,
|
runs/Feb14_23-30-17_c0c8f2aaa2e2/events.out.tfevents.1707953419.c0c8f2aaa2e2.13823.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:327010a88967fde30a7afeb05f5dc5c662a91644b86034d4af13fe905a428b08
|
| 3 |
+
size 6818
|
runs/Feb14_23-33-02_c0c8f2aaa2e2/events.out.tfevents.1707953584.c0c8f2aaa2e2.14103.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39488b54cff86fb285cd28abd5375f893c8fe955926996f5d6ae6c6f7b5e52cc
|
| 3 |
+
size 6818
|
tokenizer.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"version": "1.0",
|
| 3 |
"truncation": {
|
| 4 |
"direction": "Right",
|
| 5 |
-
"max_length":
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
|
|
|
| 2 |
"version": "1.0",
|
| 3 |
"truncation": {
|
| 4 |
"direction": "Right",
|
| 5 |
+
"max_length": 512,
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4283
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9774c03f2c19adbb371e13b89fb1d396860e4a70625a986cb06caf788ac571a3
|
| 3 |
size 4283
|