radoslavralev committed on
Commit
dec7e48
·
verified ·
1 Parent(s): 65db05a

Training in progress, step 44

Browse files
config.json CHANGED
@@ -4,7 +4,7 @@
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
- "dtype": "float32",
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
 
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
+ "dtype": "bfloat16",
8
  "gradient_checkpointing": false,
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
eval/Information-Retrieval_evaluation_test_results.csv CHANGED
@@ -5,3 +5,4 @@ epoch,steps,cosine-Accuracy@1,cosine-Precision@1,cosine-Recall@1,cosine-MRR@1,co
5
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
6
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
7
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
 
 
5
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
6
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
7
  0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619419081029518,0.7107794631883741,{1: np.float64(0.3488530268041688)},{1: np.float64(0.1634818016054941)}
8
+ 0,0,0.5763286334056399,0.5763286334056399,0.5589816867630893,0.5763286334056399,0.7619433934524245,0.7107811578738404,{1: np.float64(0.3488530268041688)},{1: np.float64(0.16348145891100385)}
final_metrics.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "test_cosine_accuracy@1": 0.5907673535791758,
3
- "test_cosine_precision@1": 0.5907673535791758,
4
- "test_cosine_recall@1": 0.5736536031059655,
5
- "test_cosine_ndcg@10": 0.7683210399939226,
6
- "test_cosine_mrr@1": 0.5907673535791758,
7
- "test_cosine_map@100": 0.7197265061480947,
8
- "test_cosine_auc_precision_cache_hit_ratio": 0.362715739266966,
9
- "test_cosine_auc_similarity_distribution": 0.18036238269388047
10
  }
 
1
  {
2
+ "test_cosine_accuracy@1": 0.5910385032537961,
3
+ "test_cosine_precision@1": 0.5910385032537961,
4
+ "test_cosine_recall@1": 0.5738230716526032,
5
+ "test_cosine_ndcg@10": 0.7683219224836483,
6
+ "test_cosine_mrr@1": 0.5910385032537961,
7
+ "test_cosine_map@100": 0.7197776205033837,
8
+ "test_cosine_auc_precision_cache_hit_ratio": 0.3631867644548676,
9
+ "test_cosine_auc_similarity_distribution": 0.18035724992406232
10
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:194a08727688936a34d326a0b7ec7c4aff6c34e983fb7bfbd69eb0a270dd95ae
3
- size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec3cf21b9dac967ed24a078c8554f9c345e2b737507a2bd9751787934fc0930f
3
+ size 45437864
tokenizer.json CHANGED
@@ -2,7 +2,7 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 100,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bba6129a61a7388979816903a6bf7444ce80499690b9c66aa7b52b223733e322
3
  size 6289
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a9bd00f5832ad915908d05d5af131be19994bb3713a1256dcd0846c315ddf73
3
  size 6289