la run on qqp
Browse files- outputs/qqp/args.json +41 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/logfile_la_all.log +30 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/gpu_stats_la.json +130 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/gpu_stats_la.json +130 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/gpu_stats_la.json +130 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/gpu_stats_la.json +130 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/gpu_stats_la.json +130 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/all_results_la_kron_all_homo_mc_corr_1000.json +1 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/eval_res_la_kron_all_homo_mc_corr_1000.json +0 -0
- outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/gpu_stats_la.json +130 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/prior_precision_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/f_mu_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/f_var_kron_all_homo_1000.pt +3 -0
- outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/prior_precision_kron_all_homo_1000.pt +3 -0
outputs/qqp/args.json
ADDED
|
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"task_name": "qqp",
|
| 3 |
+
"train_file": null,
|
| 4 |
+
"validation_file": null,
|
| 5 |
+
"max_length": 300,
|
| 6 |
+
"pad_to_max_length": false,
|
| 7 |
+
"model_name_or_path": "bert-base-uncased",
|
| 8 |
+
"use_slow_tokenizer": false,
|
| 9 |
+
"per_device_train_batch_size": 32,
|
| 10 |
+
"per_device_eval_batch_size": 8,
|
| 11 |
+
"learning_rate": 0.0001,
|
| 12 |
+
"weight_decay": 0.0,
|
| 13 |
+
"num_train_epochs": 3,
|
| 14 |
+
"max_train_steps": null,
|
| 15 |
+
"peft_method": null,
|
| 16 |
+
"gradient_accumulation_steps": 1,
|
| 17 |
+
"lr_scheduler_type": "linear",
|
| 18 |
+
"num_warmup_steps": 0,
|
| 19 |
+
"output_dir": "./outputs",
|
| 20 |
+
"seed": 65,
|
| 21 |
+
"push_to_hub": false,
|
| 22 |
+
"hub_model_id": null,
|
| 23 |
+
"hub_token": null,
|
| 24 |
+
"checkpointing_steps": "1000",
|
| 25 |
+
"resume_from_checkpoint": null,
|
| 26 |
+
"with_tracking": false,
|
| 27 |
+
"report_to": "all",
|
| 28 |
+
"ignore_mismatched_sizes": true,
|
| 29 |
+
"save": false,
|
| 30 |
+
"load_step": 999,
|
| 31 |
+
"lora_r": 8,
|
| 32 |
+
"lora_alpha": 16,
|
| 33 |
+
"lora_dropout": 0.1,
|
| 34 |
+
"laplace_hessian": "kron",
|
| 35 |
+
"laplace_sub": "all",
|
| 36 |
+
"laplace_prior": "homo",
|
| 37 |
+
"laplace_optim_step": 1000,
|
| 38 |
+
"testing_set": "train_val",
|
| 39 |
+
"cache_dir": "/content/cache/huggingface/metrics/",
|
| 40 |
+
"laplace_predict": "mc_corr"
|
| 41 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/logfile_la_all.log
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
05/27/2024 09:52:57 - INFO - __main__ - ***** Starting script *****
|
| 2 |
+
05/27/2024 09:54:47 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 3 |
+
05/27/2024 09:54:47 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 4 |
+
05/27/2024 09:54:47 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 5 |
+
05/27/2024 11:21:21 - INFO - __main__ - ***** Completed Script *****
|
| 6 |
+
05/27/2024 11:21:27 - INFO - __main__ - ***** Starting script *****
|
| 7 |
+
05/27/2024 11:23:09 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 8 |
+
05/27/2024 11:23:09 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 9 |
+
05/27/2024 11:23:09 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 10 |
+
05/27/2024 12:50:25 - INFO - __main__ - ***** Completed Script *****
|
| 11 |
+
05/27/2024 12:50:30 - INFO - __main__ - ***** Starting script *****
|
| 12 |
+
05/27/2024 12:52:13 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 13 |
+
05/27/2024 12:52:13 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 14 |
+
05/27/2024 12:52:13 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 15 |
+
05/27/2024 14:19:18 - INFO - __main__ - ***** Completed Script *****
|
| 16 |
+
05/27/2024 14:19:24 - INFO - __main__ - ***** Starting script *****
|
| 17 |
+
05/27/2024 14:21:08 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 18 |
+
05/27/2024 14:21:08 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 19 |
+
05/27/2024 14:21:08 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 20 |
+
05/27/2024 15:48:54 - INFO - __main__ - ***** Completed Script *****
|
| 21 |
+
05/27/2024 15:48:59 - INFO - __main__ - ***** Starting script *****
|
| 22 |
+
05/27/2024 15:50:40 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 23 |
+
05/27/2024 15:50:40 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 24 |
+
05/27/2024 15:50:40 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 25 |
+
05/27/2024 17:19:48 - INFO - __main__ - ***** Completed Script *****
|
| 26 |
+
05/27/2024 17:19:53 - INFO - __main__ - ***** Starting script *****
|
| 27 |
+
05/27/2024 17:21:43 - INFO - __main__ - Sample 217445 of the training set: {'input_ids': [101, 2065, 1999, 1037, 7473, 1037, 17595, 4274, 5830, 2003, 4198, 1998, 1045, 2215, 2000, 2113, 2037, 15536, 1011, 10882, 20786, 1010, 2059, 2129, 2079, 1045, 2424, 1037, 20786, 1029, 102, 2129, 2064, 1045, 2156, 1996, 5552, 15536, 1011, 10882, 20786, 2015, 2006, 2026, 4684, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 28 |
+
05/27/2024 17:21:43 - INFO - __main__ - Sample 151437 of the training set: {'input_ids': [101, 2129, 2079, 1045, 6855, 1037, 2248, 2769, 11659, 6105, 1999, 2634, 1029, 2005, 1037, 2978, 3597, 2378, 2128, 22930, 26897, 22752, 1012, 102, 3784, 7909, 11909, 2015, 1998, 6364, 1024, 2003, 1037, 2194, 2066, 1043, 2100, 6199, 1010, 2029, 15187, 3573, 5592, 5329, 1999, 3863, 2005, 2978, 3597, 2378, 1010, 2641, 1037, 2769, 11659, 1998, 3223, 2000, 2031, 1037, 6105, 2000, 5452, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 29 |
+
05/27/2024 17:21:43 - INFO - __main__ - Sample 150837 of the training set: {'input_ids': [101, 2129, 2079, 2017, 2113, 2065, 2017, 2024, 23958, 16778, 2278, 1029, 102, 2054, 2515, 2108, 23958, 16778, 2278, 2514, 2066, 1029, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], 'labels': 0}.
|
| 30 |
+
05/27/2024 18:50:56 - INFO - __main__ - ***** Completed Script *****
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.3832797427652733, "eval_f1": 0.5440681685196022}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_0/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808749568,
|
| 3 |
+
"max_memory_allocated": 5014978048,
|
| 4 |
+
"memory_reserved": 6358564864,
|
| 5 |
+
"max_memory_reserved": 6727663616,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 24482704,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 24471895,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 11722181,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 11721959,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 12760523,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 12749936,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 78209693356544,
|
| 20 |
+
"active_bytes.all.current": 808749568,
|
| 21 |
+
"active_bytes.all.freed": 78208884606976,
|
| 22 |
+
"active_bytes.all.peak": 5014978048,
|
| 23 |
+
"active_bytes.large_pool.allocated": 74862721955840,
|
| 24 |
+
"active_bytes.large_pool.current": 799473664,
|
| 25 |
+
"active_bytes.large_pool.freed": 74861922482176,
|
| 26 |
+
"active_bytes.large_pool.peak": 4997783552,
|
| 27 |
+
"active_bytes.small_pool.allocated": 3346971400704,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 3346962124800,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 78209693356544,
|
| 32 |
+
"allocated_bytes.all.current": 808749568,
|
| 33 |
+
"allocated_bytes.all.freed": 78208884606976,
|
| 34 |
+
"allocated_bytes.all.peak": 5014978048,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 74862721955840,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799473664,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 74861922482176,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4997783552,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 3346971400704,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 3346962124800,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 24482704,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 24471895,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 11722181,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 11721959,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 12760523,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 12749936,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 12808394,
|
| 56 |
+
"inactive_split.all.current": 115,
|
| 57 |
+
"inactive_split.all.freed": 12808279,
|
| 58 |
+
"inactive_split.all.peak": 246,
|
| 59 |
+
"inactive_split.large_pool.allocated": 8088991,
|
| 60 |
+
"inactive_split.large_pool.current": 38,
|
| 61 |
+
"inactive_split.large_pool.freed": 8088953,
|
| 62 |
+
"inactive_split.large_pool.peak": 135,
|
| 63 |
+
"inactive_split.small_pool.allocated": 4719403,
|
| 64 |
+
"inactive_split.small_pool.current": 77,
|
| 65 |
+
"inactive_split.small_pool.freed": 4719326,
|
| 66 |
+
"inactive_split.small_pool.peak": 156,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 71846063992832,
|
| 68 |
+
"inactive_split_bytes.all.current": 116094464,
|
| 69 |
+
"inactive_split_bytes.all.freed": 71845947898368,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 68396959819776,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 91815936,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 68396868003840,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 3449104173056,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 24278528,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 3449079894528,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 84646400,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 436,
|
| 82 |
+
"num_device_free": 130,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 1,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 77380438428195,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 77379638031219,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 74034645754624,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 74033850362624,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 3345792673571,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 3345787668595,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 12182355968,
|
| 106 |
+
"reserved_bytes.all.current": 6358564864,
|
| 107 |
+
"reserved_bytes.all.freed": 5823791104,
|
| 108 |
+
"reserved_bytes.all.peak": 6727663616,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 12002000896,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6230638592,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 5771362304,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6662651904,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 180355072,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 52428800,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 436,
|
| 118 |
+
"segment.all.current": 306,
|
| 119 |
+
"segment.all.freed": 130,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 350,
|
| 122 |
+
"segment.large_pool.current": 245,
|
| 123 |
+
"segment.large_pool.freed": 105,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 86,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 25,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.8534504081127875, "eval_f1": 0.801221189653437}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_10915/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808356352,
|
| 3 |
+
"max_memory_allocated": 5015770624,
|
| 4 |
+
"memory_reserved": 6350176256,
|
| 5 |
+
"max_memory_reserved": 6752829440,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 73448108,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 73437299,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 35166539,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 35166317,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 38281569,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 38270982,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 234626955736064,
|
| 20 |
+
"active_bytes.all.current": 808356352,
|
| 21 |
+
"active_bytes.all.freed": 234626147379712,
|
| 22 |
+
"active_bytes.all.peak": 5015770624,
|
| 23 |
+
"active_bytes.large_pool.allocated": 224586041533952,
|
| 24 |
+
"active_bytes.large_pool.current": 799080448,
|
| 25 |
+
"active_bytes.large_pool.freed": 224585242453504,
|
| 26 |
+
"active_bytes.large_pool.peak": 4998576128,
|
| 27 |
+
"active_bytes.small_pool.allocated": 10040914202112,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 10040904926208,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 234626955736064,
|
| 32 |
+
"allocated_bytes.all.current": 808356352,
|
| 33 |
+
"allocated_bytes.all.freed": 234626147379712,
|
| 34 |
+
"allocated_bytes.all.peak": 5015770624,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 224586041533952,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799080448,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 224585242453504,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4998576128,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 10040914202112,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 10040904926208,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 73448108,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 73437299,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 35166539,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 35166317,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 38281569,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 38270982,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 38491526,
|
| 56 |
+
"inactive_split.all.current": 119,
|
| 57 |
+
"inactive_split.all.freed": 38491407,
|
| 58 |
+
"inactive_split.all.peak": 1966,
|
| 59 |
+
"inactive_split.large_pool.allocated": 24502987,
|
| 60 |
+
"inactive_split.large_pool.current": 38,
|
| 61 |
+
"inactive_split.large_pool.freed": 24502949,
|
| 62 |
+
"inactive_split.large_pool.peak": 141,
|
| 63 |
+
"inactive_split.small_pool.allocated": 13988539,
|
| 64 |
+
"inactive_split.small_pool.current": 81,
|
| 65 |
+
"inactive_split.small_pool.freed": 13988458,
|
| 66 |
+
"inactive_split.small_pool.peak": 1920,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 216296435532288,
|
| 68 |
+
"inactive_split_bytes.all.current": 120681984,
|
| 69 |
+
"inactive_split_bytes.all.freed": 216296314850304,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 205937432882688,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 92209152,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 205937340673536,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 10359002649600,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 28472832,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 10358974176768,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 84646400,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 1230,
|
| 82 |
+
"num_device_free": 924,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 5,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 232141281205865,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 232140480808889,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 222103903185152,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 222103107793152,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 10037378020713,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 10037373015737,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 34997272576,
|
| 106 |
+
"reserved_bytes.all.current": 6350176256,
|
| 107 |
+
"reserved_bytes.all.freed": 28647096320,
|
| 108 |
+
"reserved_bytes.all.peak": 6752829440,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 34483470336,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6222249984,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 28261220352,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6687817728,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 513802240,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 385875968,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 1230,
|
| 118 |
+
"segment.all.current": 306,
|
| 119 |
+
"segment.all.freed": 924,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 985,
|
| 122 |
+
"segment.large_pool.current": 245,
|
| 123 |
+
"segment.large_pool.freed": 740,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 245,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 184,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.8614889933217907, "eval_f1": 0.8166939443535187}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_16373/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808552960,
|
| 3 |
+
"max_memory_allocated": 5015770624,
|
| 4 |
+
"memory_reserved": 6345981952,
|
| 5 |
+
"max_memory_reserved": 6752829440,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 97930810,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 97920001,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 46888718,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 46888496,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 51042092,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 51031505,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 312846567023616,
|
| 20 |
+
"active_bytes.all.current": 808552960,
|
| 21 |
+
"active_bytes.all.freed": 312845758470656,
|
| 22 |
+
"active_bytes.all.peak": 5015770624,
|
| 23 |
+
"active_bytes.large_pool.allocated": 299458681420800,
|
| 24 |
+
"active_bytes.large_pool.current": 799277056,
|
| 25 |
+
"active_bytes.large_pool.freed": 299457882143744,
|
| 26 |
+
"active_bytes.large_pool.peak": 4998576128,
|
| 27 |
+
"active_bytes.small_pool.allocated": 13387885602816,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 13387876326912,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 312846567023616,
|
| 32 |
+
"allocated_bytes.all.current": 808552960,
|
| 33 |
+
"allocated_bytes.all.freed": 312845758470656,
|
| 34 |
+
"allocated_bytes.all.peak": 5015770624,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 299458681420800,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799277056,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 299457882143744,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4998576128,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 13387885602816,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 13387876326912,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 97930810,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 97920001,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 46888718,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 46888496,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 51042092,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 51031505,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 51328722,
|
| 56 |
+
"inactive_split.all.current": 125,
|
| 57 |
+
"inactive_split.all.freed": 51328597,
|
| 58 |
+
"inactive_split.all.peak": 1966,
|
| 59 |
+
"inactive_split.large_pool.allocated": 32685617,
|
| 60 |
+
"inactive_split.large_pool.current": 43,
|
| 61 |
+
"inactive_split.large_pool.freed": 32685574,
|
| 62 |
+
"inactive_split.large_pool.peak": 141,
|
| 63 |
+
"inactive_split.small_pool.allocated": 18643105,
|
| 64 |
+
"inactive_split.small_pool.current": 82,
|
| 65 |
+
"inactive_split.small_pool.freed": 18643023,
|
| 66 |
+
"inactive_split.small_pool.peak": 1920,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 288630388610048,
|
| 68 |
+
"inactive_split_bytes.all.current": 143554048,
|
| 69 |
+
"inactive_split_bytes.all.freed": 288630245056000,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 274820238239232,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 121372672,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 274820116866560,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 13810150370816,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 22181376,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 13810128189440,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 85829632,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 1627,
|
| 82 |
+
"num_device_free": 1322,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 7,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 309521702594700,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 309520902197724,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 296138531900416,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 296137736508416,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 13383170694284,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 13383165689308,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 46401585152,
|
| 106 |
+
"reserved_bytes.all.current": 6345981952,
|
| 107 |
+
"reserved_bytes.all.freed": 40055603200,
|
| 108 |
+
"reserved_bytes.all.peak": 6752829440,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 45720010752,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6218055680,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 39501955072,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6687817728,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 681574400,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 553648128,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 1627,
|
| 118 |
+
"segment.all.current": 305,
|
| 119 |
+
"segment.all.freed": 1322,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 1302,
|
| 122 |
+
"segment.large_pool.current": 244,
|
| 123 |
+
"segment.large_pool.freed": 1058,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 325,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 264,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.8638139995053178, "eval_f1": 0.8181638044914136}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_21831/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808356352,
|
| 3 |
+
"max_memory_allocated": 5015770624,
|
| 4 |
+
"memory_reserved": 6350176256,
|
| 5 |
+
"max_memory_reserved": 6752829440,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 122413512,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 122402703,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 58610897,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 58610675,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 63802615,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 63792028,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 391045242961408,
|
| 20 |
+
"active_bytes.all.current": 808356352,
|
| 21 |
+
"active_bytes.all.freed": 391044434605056,
|
| 22 |
+
"active_bytes.all.peak": 5015770624,
|
| 23 |
+
"active_bytes.large_pool.allocated": 374310385957888,
|
| 24 |
+
"active_bytes.large_pool.current": 799080448,
|
| 25 |
+
"active_bytes.large_pool.freed": 374309586877440,
|
| 26 |
+
"active_bytes.large_pool.peak": 4998576128,
|
| 27 |
+
"active_bytes.small_pool.allocated": 16734857003520,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 16734847727616,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 391045242961408,
|
| 32 |
+
"allocated_bytes.all.current": 808356352,
|
| 33 |
+
"allocated_bytes.all.freed": 391044434605056,
|
| 34 |
+
"allocated_bytes.all.peak": 5015770624,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 374310385957888,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799080448,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 374309586877440,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4998576128,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 16734857003520,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 16734847727616,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 122413512,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 122402703,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 58610897,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 58610675,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 63802615,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 63792028,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 64144648,
|
| 56 |
+
"inactive_split.all.current": 110,
|
| 57 |
+
"inactive_split.all.freed": 64144538,
|
| 58 |
+
"inactive_split.all.peak": 1980,
|
| 59 |
+
"inactive_split.large_pool.allocated": 40914502,
|
| 60 |
+
"inactive_split.large_pool.current": 38,
|
| 61 |
+
"inactive_split.large_pool.freed": 40914464,
|
| 62 |
+
"inactive_split.large_pool.peak": 141,
|
| 63 |
+
"inactive_split.small_pool.allocated": 23230146,
|
| 64 |
+
"inactive_split.small_pool.current": 72,
|
| 65 |
+
"inactive_split.small_pool.freed": 23230074,
|
| 66 |
+
"inactive_split.small_pool.peak": 1934,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 360737834738688,
|
| 68 |
+
"inactive_split_bytes.all.current": 120681984,
|
| 69 |
+
"inactive_split_bytes.all.freed": 360737714056704,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 343478534163456,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 92209152,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 343478441954304,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 17259300575232,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 28472832,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 17259272102400,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 85829632,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 2025,
|
| 82 |
+
"num_device_free": 1719,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 9,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 386902123983535,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 386901323586559,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 370173160615680,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 370172365223680,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 16728963367855,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 16728958362879,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 57814286336,
|
| 106 |
+
"reserved_bytes.all.current": 6350176256,
|
| 107 |
+
"reserved_bytes.all.freed": 51464110080,
|
| 108 |
+
"reserved_bytes.all.peak": 6752829440,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 56964939776,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6222249984,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 50742689792,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6687817728,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 849346560,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 721420288,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 2025,
|
| 118 |
+
"segment.all.current": 306,
|
| 119 |
+
"segment.all.freed": 1719,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 1620,
|
| 122 |
+
"segment.large_pool.current": 245,
|
| 123 |
+
"segment.large_pool.freed": 1375,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 405,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 344,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.8644818204303735, "eval_f1": 0.8207544083488729}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_27290/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808552960,
|
| 3 |
+
"max_memory_allocated": 5015770624,
|
| 4 |
+
"memory_reserved": 6354370560,
|
| 5 |
+
"max_memory_reserved": 6752829440,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 146896213,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 146885404,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 70333076,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 70332854,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 76563137,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 76552550,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 469258036103680,
|
| 20 |
+
"active_bytes.all.current": 808552960,
|
| 21 |
+
"active_bytes.all.freed": 469257227550720,
|
| 22 |
+
"active_bytes.all.peak": 5015770624,
|
| 23 |
+
"active_bytes.large_pool.allocated": 449176207699968,
|
| 24 |
+
"active_bytes.large_pool.current": 799277056,
|
| 25 |
+
"active_bytes.large_pool.freed": 449175408422912,
|
| 26 |
+
"active_bytes.large_pool.peak": 4998576128,
|
| 27 |
+
"active_bytes.small_pool.allocated": 20081828403712,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 20081819127808,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 469258036103680,
|
| 32 |
+
"allocated_bytes.all.current": 808552960,
|
| 33 |
+
"allocated_bytes.all.freed": 469257227550720,
|
| 34 |
+
"allocated_bytes.all.peak": 5015770624,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 449176207699968,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799277056,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 449175408422912,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4998576128,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 20081828403712,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 20081819127808,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 146896213,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 146885404,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 70333076,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 70332854,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 76563137,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 76552550,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 76956505,
|
| 56 |
+
"inactive_split.all.current": 116,
|
| 57 |
+
"inactive_split.all.freed": 76956389,
|
| 58 |
+
"inactive_split.all.peak": 2062,
|
| 59 |
+
"inactive_split.large_pool.allocated": 49091858,
|
| 60 |
+
"inactive_split.large_pool.current": 39,
|
| 61 |
+
"inactive_split.large_pool.freed": 49091819,
|
| 62 |
+
"inactive_split.large_pool.peak": 141,
|
| 63 |
+
"inactive_split.small_pool.allocated": 27864647,
|
| 64 |
+
"inactive_split.small_pool.current": 77,
|
| 65 |
+
"inactive_split.small_pool.freed": 27864570,
|
| 66 |
+
"inactive_split.small_pool.peak": 2018,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 432880781105152,
|
| 68 |
+
"inactive_split_bytes.all.current": 116291072,
|
| 69 |
+
"inactive_split_bytes.all.freed": 432880664814080,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 412148656592384,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 96206848,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 412148560385536,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 20732124512768,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 20084224,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 20732104428544,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 85829632,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 2425,
|
| 82 |
+
"num_device_free": 2119,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 11,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 464282545372369,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 464281744975393,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 444207789330944,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 444206993938944,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 20074756041425,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 20074751036449,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 69254250496,
|
| 106 |
+
"reserved_bytes.all.current": 6354370560,
|
| 107 |
+
"reserved_bytes.all.freed": 62899879936,
|
| 108 |
+
"reserved_bytes.all.peak": 6752829440,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 68235034624,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6226444288,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 62008590336,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6687817728,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 1019215872,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 891289600,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 2425,
|
| 118 |
+
"segment.all.current": 306,
|
| 119 |
+
"segment.all.freed": 2119,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 1939,
|
| 122 |
+
"segment.large_pool.current": 245,
|
| 123 |
+
"segment.large_pool.freed": 1694,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 486,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 425,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/all_results_la_kron_all_homo_mc_corr_1000.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"eval_accuracy": 0.8413306950284443, "eval_f1": 0.7981498379534944}
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/eval_res_la_kron_all_homo_mc_corr_1000.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
outputs/qqp/bert-base-uncased_loratrain_val_8_16_0.1_0.0001_65/step_5457/gpu_stats_la.json
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"memory_allocated": 808552960,
|
| 3 |
+
"max_memory_allocated": 5015770624,
|
| 4 |
+
"memory_reserved": 6345981952,
|
| 5 |
+
"max_memory_reserved": 6748635136,
|
| 6 |
+
"memory_stats": {
|
| 7 |
+
"active.all.allocated": 48965406,
|
| 8 |
+
"active.all.current": 10809,
|
| 9 |
+
"active.all.freed": 48954597,
|
| 10 |
+
"active.all.peak": 10985,
|
| 11 |
+
"active.large_pool.allocated": 23444360,
|
| 12 |
+
"active.large_pool.current": 222,
|
| 13 |
+
"active.large_pool.freed": 23444138,
|
| 14 |
+
"active.large_pool.peak": 360,
|
| 15 |
+
"active.small_pool.allocated": 25521046,
|
| 16 |
+
"active.small_pool.current": 10587,
|
| 17 |
+
"active.small_pool.freed": 25510459,
|
| 18 |
+
"active.small_pool.peak": 10750,
|
| 19 |
+
"active_bytes.all.allocated": 156429420911104,
|
| 20 |
+
"active_bytes.all.current": 808552960,
|
| 21 |
+
"active_bytes.all.freed": 156428612358144,
|
| 22 |
+
"active_bytes.all.peak": 5015770624,
|
| 23 |
+
"active_bytes.large_pool.allocated": 149735478109696,
|
| 24 |
+
"active_bytes.large_pool.current": 799277056,
|
| 25 |
+
"active_bytes.large_pool.freed": 149734678832640,
|
| 26 |
+
"active_bytes.large_pool.peak": 4998576128,
|
| 27 |
+
"active_bytes.small_pool.allocated": 6693942801408,
|
| 28 |
+
"active_bytes.small_pool.current": 9275904,
|
| 29 |
+
"active_bytes.small_pool.freed": 6693933525504,
|
| 30 |
+
"active_bytes.small_pool.peak": 124137472,
|
| 31 |
+
"allocated_bytes.all.allocated": 156429420911104,
|
| 32 |
+
"allocated_bytes.all.current": 808552960,
|
| 33 |
+
"allocated_bytes.all.freed": 156428612358144,
|
| 34 |
+
"allocated_bytes.all.peak": 5015770624,
|
| 35 |
+
"allocated_bytes.large_pool.allocated": 149735478109696,
|
| 36 |
+
"allocated_bytes.large_pool.current": 799277056,
|
| 37 |
+
"allocated_bytes.large_pool.freed": 149734678832640,
|
| 38 |
+
"allocated_bytes.large_pool.peak": 4998576128,
|
| 39 |
+
"allocated_bytes.small_pool.allocated": 6693942801408,
|
| 40 |
+
"allocated_bytes.small_pool.current": 9275904,
|
| 41 |
+
"allocated_bytes.small_pool.freed": 6693933525504,
|
| 42 |
+
"allocated_bytes.small_pool.peak": 124137472,
|
| 43 |
+
"allocation.all.allocated": 48965406,
|
| 44 |
+
"allocation.all.current": 10809,
|
| 45 |
+
"allocation.all.freed": 48954597,
|
| 46 |
+
"allocation.all.peak": 10985,
|
| 47 |
+
"allocation.large_pool.allocated": 23444360,
|
| 48 |
+
"allocation.large_pool.current": 222,
|
| 49 |
+
"allocation.large_pool.freed": 23444138,
|
| 50 |
+
"allocation.large_pool.peak": 360,
|
| 51 |
+
"allocation.small_pool.allocated": 25521046,
|
| 52 |
+
"allocation.small_pool.current": 10587,
|
| 53 |
+
"allocation.small_pool.freed": 25510459,
|
| 54 |
+
"allocation.small_pool.peak": 10750,
|
| 55 |
+
"inactive_split.all.allocated": 25627967,
|
| 56 |
+
"inactive_split.all.current": 124,
|
| 57 |
+
"inactive_split.all.freed": 25627843,
|
| 58 |
+
"inactive_split.all.peak": 1926,
|
| 59 |
+
"inactive_split.large_pool.allocated": 16274004,
|
| 60 |
+
"inactive_split.large_pool.current": 43,
|
| 61 |
+
"inactive_split.large_pool.freed": 16273961,
|
| 62 |
+
"inactive_split.large_pool.peak": 141,
|
| 63 |
+
"inactive_split.small_pool.allocated": 9353963,
|
| 64 |
+
"inactive_split.small_pool.current": 81,
|
| 65 |
+
"inactive_split.small_pool.freed": 9353882,
|
| 66 |
+
"inactive_split.small_pool.peak": 1881,
|
| 67 |
+
"inactive_split_bytes.all.allocated": 144184470591488,
|
| 68 |
+
"inactive_split_bytes.all.current": 149845504,
|
| 69 |
+
"inactive_split_bytes.all.freed": 144184320745984,
|
| 70 |
+
"inactive_split_bytes.all.peak": 1893863936,
|
| 71 |
+
"inactive_split_bytes.large_pool.allocated": 137280417156096,
|
| 72 |
+
"inactive_split_bytes.large_pool.current": 121372672,
|
| 73 |
+
"inactive_split_bytes.large_pool.freed": 137280295783424,
|
| 74 |
+
"inactive_split_bytes.large_pool.peak": 1887404032,
|
| 75 |
+
"inactive_split_bytes.small_pool.allocated": 6904053435392,
|
| 76 |
+
"inactive_split_bytes.small_pool.current": 28472832,
|
| 77 |
+
"inactive_split_bytes.small_pool.freed": 6904024962560,
|
| 78 |
+
"inactive_split_bytes.small_pool.peak": 84646400,
|
| 79 |
+
"max_split_size": -1,
|
| 80 |
+
"num_alloc_retries": 0,
|
| 81 |
+
"num_device_alloc": 832,
|
| 82 |
+
"num_device_free": 527,
|
| 83 |
+
"num_ooms": 0,
|
| 84 |
+
"num_sync_all_streams": 3,
|
| 85 |
+
"oversize_allocations.allocated": 0,
|
| 86 |
+
"oversize_allocations.current": 0,
|
| 87 |
+
"oversize_allocations.freed": 0,
|
| 88 |
+
"oversize_allocations.peak": 0,
|
| 89 |
+
"oversize_segments.allocated": 0,
|
| 90 |
+
"oversize_segments.current": 0,
|
| 91 |
+
"oversize_segments.freed": 0,
|
| 92 |
+
"oversize_segments.peak": 0,
|
| 93 |
+
"requested_bytes.all.allocated": 154760859817030,
|
| 94 |
+
"requested_bytes.all.current": 800396976,
|
| 95 |
+
"requested_bytes.all.freed": 154760059420054,
|
| 96 |
+
"requested_bytes.all.peak": 4992933420,
|
| 97 |
+
"requested_bytes.large_pool.allocated": 148069274469888,
|
| 98 |
+
"requested_bytes.large_pool.current": 795392000,
|
| 99 |
+
"requested_bytes.large_pool.freed": 148068479077888,
|
| 100 |
+
"requested_bytes.large_pool.peak": 4975769600,
|
| 101 |
+
"requested_bytes.small_pool.allocated": 6691585347142,
|
| 102 |
+
"requested_bytes.small_pool.current": 5004976,
|
| 103 |
+
"requested_bytes.small_pool.freed": 6691580342166,
|
| 104 |
+
"requested_bytes.small_pool.peak": 119884008,
|
| 105 |
+
"reserved_bytes.all.allocated": 23584571392,
|
| 106 |
+
"reserved_bytes.all.current": 6345981952,
|
| 107 |
+
"reserved_bytes.all.freed": 17238589440,
|
| 108 |
+
"reserved_bytes.all.peak": 6748635136,
|
| 109 |
+
"reserved_bytes.large_pool.allocated": 23238541312,
|
| 110 |
+
"reserved_bytes.large_pool.current": 6218055680,
|
| 111 |
+
"reserved_bytes.large_pool.freed": 17020485632,
|
| 112 |
+
"reserved_bytes.large_pool.peak": 6683623424,
|
| 113 |
+
"reserved_bytes.small_pool.allocated": 346030080,
|
| 114 |
+
"reserved_bytes.small_pool.current": 127926272,
|
| 115 |
+
"reserved_bytes.small_pool.freed": 218103808,
|
| 116 |
+
"reserved_bytes.small_pool.peak": 127926272,
|
| 117 |
+
"segment.all.allocated": 832,
|
| 118 |
+
"segment.all.current": 305,
|
| 119 |
+
"segment.all.freed": 527,
|
| 120 |
+
"segment.all.peak": 306,
|
| 121 |
+
"segment.large_pool.allocated": 667,
|
| 122 |
+
"segment.large_pool.current": 244,
|
| 123 |
+
"segment.large_pool.freed": 423,
|
| 124 |
+
"segment.large_pool.peak": 245,
|
| 125 |
+
"segment.small_pool.allocated": 165,
|
| 126 |
+
"segment.small_pool.current": 61,
|
| 127 |
+
"segment.small_pool.freed": 104,
|
| 128 |
+
"segment.small_pool.peak": 61
|
| 129 |
+
}
|
| 130 |
+
}
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f73cf0717e5c7586a1af550f283a0895f0d3305f3b9de93811909f09fee50d74
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e141f9fd22ba416f74eca62856d7b5a0b4fb463f11fdafbc6244fc8b6a866980
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_0/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e918703bd3b6f42a93d9ef6d6bbb5f8a720bb6a6fee7bee386e84ac4b780c302
|
| 3 |
+
size 1379
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a9d17c9d75b37ffb0e7c6945a65d6649e292ef42486d5e3836dec31a4731626
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93aec03660b9b2ec5d20fb0fb2fc6e4641935685be0723e4ba4dc59d4b251f1b
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_10915/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:963753c4c310ad388bdf8cb5a4d793c7140171bb925289166fdb0e32587cb48c
|
| 3 |
+
size 1379
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e316591626be60985f75e4fbd7c620b56d7cc59575f1120c6f5d23e4bc47a2d
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:697d09f3b0eedc3b331363ee664700a2a4c1cdd34da74dc784efd5d17d779a9e
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_16373/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e00c56bdb3cede956360e4bdd15efed2bf199bb2b5df4dfbd6b65d91f95879d8
|
| 3 |
+
size 1379
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d0c0c8a3480930b9d1323796e86a2032b5edda71f193082484b4a83a29e7eb2
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce9560131444826701d1efc79431383618af231ca44a6c5689008253f8f9cead
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_21831/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a8efd9da5faffc52e6e5b04d85957e147cfe0640718635c2aff99c0a1dad9eb
|
| 3 |
+
size 1379
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8095fdd693e3c5476db60edadb9a2cd7a8ba9d993132476c26433081b746d51
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e851c0dacc061df969bf363d774f5b678a3cd89417c6a0ed00abe0466b9b83ad
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_27290/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1133b09c8bbda67749f039db9859cef8e13ef97be2099960ac98708090583ef1
|
| 3 |
+
size 1379
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/f_mu_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:317b13affcaa29e689abf4b622709a32a81cf7ee919bf1b91bc5bdca25973068
|
| 3 |
+
size 324780
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/f_var_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:733cdff0db61652eefe465b0cd3f87747cd5dad2cdd76ad2580d120115790088
|
| 3 |
+
size 648177
|
outputs_laplace/qqp/bert-base-uncased_loratrain_val_16_0.1_0.0001_65/step_5457/prior_precision_kron_all_homo_1000.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84019521caeb084cfbc9db1e54f42468088e1f2b9ff6a6d1139c3086ef9ecb8d
|
| 3 |
+
size 1379
|