theo-bert-base / checkpoint_metadata.json
toranb's picture
Initial release: TheoBERT Base — biblical-domain masked language model
a64c547
{
"release_stage": "mlmcontinued (stage 2, epoch 25)",
"reported_loss": 0.8958267427277438,
"parameter_count": 273051864,
"fp16_export": true,
"tokenizer": "google-bert/bert-base-uncased",
"pretraining_stages": [
{
"stage": 1,
"name": "encoder",
"objective": "token-level masked language modeling at 20% mask rate 80/10/10 split",
"epochs": 24,
"seq_len": 256,
"final_train_loss": 1.0678829201169648,
"final_train_accuracy": 76.41802635495705
},
{
"stage": 2,
"name": "mlmcontinued",
"objective": "whole-word-masking continued pretraining at 18% mask rate",
"epochs": 25,
"seq_len": 256,
"final_train_loss": 0.8958267427277438,
"final_train_accuracy": 79.66191907459469
}
],
"mlm_eval_overall_pass_rate": 0.947,
"mlm_eval_passed_cases": 517,
"mlm_eval_total_cases": 546
}