diff --git a/r0_full/run/checkpoints/acc/README.md b/r0_full/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r0_full/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r0_full/run/checkpoints/acc/adapter_config.json b/r0_full/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r0_full/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r0_full/run/checkpoints/acc/adapter_model.safetensors b/r0_full/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46a98334ff3ea946c39c82d19fe9ccd8f00ae222 --- /dev/null +++ b/r0_full/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d023b55d9d4642dabc2fa070ac45d29e75596408b54a37190667467432cafcac +size 45771496 diff --git a/r0_full/run/checkpoints/acc/best_optimizer.pt b/r0_full/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..842948dda83844498561c53c89a6196f3fe4a1f4 --- /dev/null +++ b/r0_full/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9befa6f3041c71a73a61664b0060dd600d6ce1d58a0d699aa82d8b9d6cc963 +size 91855438 diff --git a/r0_full/run/checkpoints/acc/best_scheduler.pt b/r0_full/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7beeb4f1a43bedc60c957734efd2c4bcb3a9081 --- /dev/null +++ b/r0_full/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64a691c6993fec11fb1484fbc2db955ce092b96ef7c35a038fb0756354926cd +size 1084 diff --git a/r0_full/run/checkpoints/acc/saved_metrics.pth b/r0_full/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0b580de6e28e2184ed11a5ce667eb724bb83054a --- /dev/null +++ b/r0_full/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0563b720d0a3c5c852603683dedf11945686ad74408aa3089542112afd963961 +size 1208 diff --git a/r0_full/run/logging/epoch_0_train_metrics.pth b/r0_full/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c21129be33401d83063930795f80ec21393cf9d --- /dev/null +++ b/r0_full/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0644574bbd56621f65dbbdbf175d93fabd6675ca14ed192a72ba2361fea53d5 +size 1304 diff --git a/r0_full/run/logging/epoch_0_val_metrics.pth b/r0_full/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba015b7543083d93fd768b0bedf1bbbe4ec12f5e --- /dev/null +++ b/r0_full/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a223a06a0e8fa0631a44c59df301d2fa4c71396909112c732eddf4b7e79d8798 +size 1360 diff --git a/r0_full/run/logging/epoch_10_train_metrics.pth b/r0_full/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ee4bfdc4257c6eed1e02c748b017bc9c7ecceb5 --- /dev/null +++ b/r0_full/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7efb0e1717789d7f47c39f1097b80392522b434f427750a47d9cc0c038235b +size 1372 diff --git a/r0_full/run/logging/epoch_10_val_metrics.pth b/r0_full/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f7c077624d3d68045cf6c96f33bcf040702166e --- /dev/null +++ b/r0_full/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2e0e7456ec0d42bad5fcffef505114c5b39d6116d993494324d9dfe53f1924 +size 1364 diff --git a/r0_full/run/logging/epoch_11_train_metrics.pth b/r0_full/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9740924491ef4476260caea3fb567f7f74b7301 --- /dev/null +++ b/r0_full/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6322bccb60963c3fdb82a5bd0c0fc217b268b8da4114da058cc2f45ee4bae94 +size 1372 diff --git a/r0_full/run/logging/epoch_11_val_metrics.pth b/r0_full/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..994d73f614dc51218b527c1b6064328eb7b80b18 --- /dev/null +++ b/r0_full/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8cf996968b473736b33fe49cc4d00dbb7eb486adb8832384b13c79764b85044 +size 1364 diff --git a/r0_full/run/logging/epoch_12_train_metrics.pth b/r0_full/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d9bf03bf52a1dad3b0716bba8d7a74359da5047 --- /dev/null +++ b/r0_full/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6df0d274ae212c414a339497f89874f21ece4be908920254e00533e84e05834 +size 1372 diff --git a/r0_full/run/logging/epoch_12_val_metrics.pth b/r0_full/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..90371663a56a75516c37167f922e0743a2bce853 --- /dev/null +++ b/r0_full/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068aa2d20e190525108bde73f327df4a742bdda219983a832afc5b70c6ddd5a8 +size 1364 diff --git a/r0_full/run/logging/epoch_1_train_metrics.pth b/r0_full/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..baa0a32c8d5eb92a42a56c8f976213430f2c8352 --- /dev/null +++ b/r0_full/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95bb69a41dac5c0c4d1040a2515efb333e647ae09db072f5fca7250009b11d4 +size 1304 diff --git a/r0_full/run/logging/epoch_1_val_metrics.pth b/r0_full/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9100ed89e079e379300877e7032c59ba1c6ef792 --- /dev/null +++ b/r0_full/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d634f030d0362824b84dbf0e2c17c6dd32fce7dc600b55e695d5da11cafe8e7 +size 1360 diff --git a/r0_full/run/logging/epoch_2_train_metrics.pth b/r0_full/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0fd146a2f6d628ff2c033a17f1fb2e088fa2bbe --- /dev/null +++ b/r0_full/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eeef3179763c22891f9c76e7dea5b42be064568ff5d3579fb94d10c7a92fa09 +size 1304 diff --git a/r0_full/run/logging/epoch_2_val_metrics.pth b/r0_full/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ad9db4c8b855dc2269b86efb08c77b6b2490419 --- /dev/null +++ b/r0_full/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9486129408fef603bd1d4551a732fef8603300593a57cd8a2bfd3586769c22a5 +size 1360 diff --git a/r0_full/run/logging/epoch_3_train_metrics.pth b/r0_full/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5d3df1fd50732878ee143c737691520c91d1b59 --- /dev/null +++ b/r0_full/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51715b87284bc30ba0512cb4c3403c75f0cba4e484344b825ce64855324863f +size 1304 diff --git a/r0_full/run/logging/epoch_3_val_metrics.pth b/r0_full/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2ebcc081a059d9c30885f2bc21a64250d826aa9 --- /dev/null +++ b/r0_full/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab987bce9c4667e7686042f874c8f3dfe66e17be066d844e928799a1f8f2674 +size 1360 diff --git a/r0_full/run/logging/epoch_4_train_metrics.pth b/r0_full/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea8e096715c35178a88b2ee27ebbc73fd0a6175d --- /dev/null +++ b/r0_full/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69424abb4cf5dfede751827bf78be45e27e578cd6b85f635763c584e76d9111 +size 1304 diff --git a/r0_full/run/logging/epoch_4_val_metrics.pth b/r0_full/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d72b20f008fbc710d04b89c0fa56a0923ab980dd --- /dev/null +++ b/r0_full/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff95f67f1b5b0abac2ea2e6c678cabe195c4343a379be5626c7c96d3e6ecbc6 +size 1360 diff --git a/r0_full/run/logging/epoch_5_train_metrics.pth b/r0_full/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9384b721da9b8147dfe1724aed943746a6396cb --- /dev/null +++ b/r0_full/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0a1ce65f98e6628143a511160da8e16153bb414b80d1a9d6d859ebf4034839 +size 1304 diff --git a/r0_full/run/logging/epoch_5_val_metrics.pth b/r0_full/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d339055fea3168877c1c5e286290d2feb78d5f1d --- /dev/null +++ b/r0_full/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94962b598a8db586aae684ae42571a0977ff5cb67b1feb8ddd4882ed6def9949 +size 1360 diff --git a/r0_full/run/logging/epoch_6_train_metrics.pth b/r0_full/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..beff80306c87434e76e24257875ea3224f981a01 --- /dev/null +++ b/r0_full/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb22ee7aadf3f6f23a62aca798d8bdc5ab2fa5f218a7161a64c9ccdcb64e44d2 +size 1304 diff --git a/r0_full/run/logging/epoch_6_val_metrics.pth b/r0_full/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4665c29ad62778d43e5c3b4f70743e5a0392744 --- /dev/null +++ b/r0_full/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47559d024e0f78b0711a3d9f300fa2ae6cc0f2a458d56514a6e3f107c1ce427 +size 1360 diff --git a/r0_full/run/logging/epoch_7_train_metrics.pth b/r0_full/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..52d03833dfdffebb636c0d837aee3b8530eeef8f --- /dev/null +++ b/r0_full/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e447f121c61d82318ce9234997bf3930866f4fa694c9f0d02c5a28a07249a5cd +size 1304 diff --git a/r0_full/run/logging/epoch_7_val_metrics.pth b/r0_full/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed8ab23d6e16e2bd1f1e4e440a961383d2965c0e --- /dev/null +++ b/r0_full/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf2e0dcf1d8baaa667d6e1454dd8e90f039af53bd8d1cb7c3690a3bb2fe6be2 +size 1360 diff --git a/r0_full/run/logging/epoch_8_train_metrics.pth b/r0_full/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d70a0e752ddf1772d05e8357cfd6e94ae2e4624 --- /dev/null +++ b/r0_full/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a680166cfd144c26895e6fae889a0a69b6ad4c29c866fda59d79c32091a7ff39 +size 1304 diff --git a/r0_full/run/logging/epoch_8_val_metrics.pth b/r0_full/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..67fe4847b3a41b7f35b7fdcb9c48a89d3a1b2e7e --- /dev/null +++ b/r0_full/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4f0ee44ced703b7f0e78a33a07c1606b965418079819247c673b0ed24b250c +size 1360 diff --git a/r0_full/run/logging/epoch_9_train_metrics.pth b/r0_full/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7f35faf071ed063bbb6119a383535f66e10c57e --- /dev/null +++ b/r0_full/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0426d41620491b9738568a334362088bc3a35474c3262f47804c30d3501499ac +size 1304 diff --git a/r0_full/run/logging/epoch_9_val_metrics.pth b/r0_full/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..321b3068042826f68052cd8c4d359731cf680f70 --- /dev/null +++ b/r0_full/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12233438c63c43840ec7ed37a4f05442a112ea7fa66b278b48437a70f54aa175 +size 1360 diff --git a/r0_full/run/logging/exp_cfg.yaml b/r0_full/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..c25821f4bf722f20cbe5979cd1f1ae1fa67bc75d --- /dev/null +++ b/r0_full/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run_i2_half_seed_run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run_i2_half_seed_run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run_i2_half_seed_run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 25 +model_family_name: full +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: i2_half_seed_run +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: true +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 636171 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 1.0 +test_batch_size: 4 +top_k: 20 +top_p: 0.8 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r0_idefics2_half_seed_run +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r0_no_ji/run/checkpoints/acc/README.md b/r0_no_ji/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r0_no_ji/run/checkpoints/acc/adapter_config.json b/r0_no_ji/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r0_no_ji/run/checkpoints/acc/adapter_model.safetensors b/r0_no_ji/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd42d17617dd9baa7651f11993ac64671680c37d --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862a2297469be301efeb32495428965e37fcf47ceabf27e4554de2badba5c6e9 +size 45771496 diff --git a/r0_no_ji/run/checkpoints/acc/best_optimizer.pt b/r0_no_ji/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..86250fd03957af5a816289854eb39ca24722bf22 --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4fe1170d858d50eb3576104f3c0aa20f74f4b9ef6283cb9d1e0280c55e09a5 +size 91855438 diff --git a/r0_no_ji/run/checkpoints/acc/best_scheduler.pt b/r0_no_ji/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d4a19df499cef69f8226331889ce7b460a618de --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ac8017b9b42b70c4a55b9611785f5cfde9f8ed5f522088c445b6cbca218bea +size 1084 diff --git a/r0_no_ji/run/checkpoints/acc/saved_metrics.pth b/r0_no_ji/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..4888ae34bbd43613b7956acb3d7f1cd9160798f6 --- /dev/null +++ b/r0_no_ji/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a57f7f289540f6e2aa16d75339a8b439da3813dd7467234a519558cf87f5ab66 +size 1016 diff --git a/r0_no_ji/run/logging/epoch_0_train_metrics.pth b/r0_no_ji/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..53226df03fc47cfabe8661d5de948d693a863423 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2097d0fe0dbb9ba891721785112c4782198b5054021d8f122ae860c56cb7cb +size 1304 diff --git a/r0_no_ji/run/logging/epoch_0_val_metrics.pth b/r0_no_ji/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..735dd5f6ea4a0a03ac3329f7d2bf97574c32f2a5 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef5fff0a12fd5752bbd668efc045d249727a8d032a106139c1dd7ced07c8d11 +size 1168 diff --git a/r0_no_ji/run/logging/epoch_10_train_metrics.pth b/r0_no_ji/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3b9de8f84cf25be2f8da87f39e2f9f5877dca07 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a78e8393ec1c3a1152b3f8c88e1dd02dcf2908151bcdc93a83e66a002d4bd18 +size 1372 diff --git a/r0_no_ji/run/logging/epoch_10_val_metrics.pth b/r0_no_ji/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2801c77795376ffd1ffe7829d4ad4a33f197cb3a --- /dev/null +++ b/r0_no_ji/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3e8d4166ca75a805a88ef92d7fb989d33bd2732e8a50583a0a6933874f654f +size 1172 diff --git a/r0_no_ji/run/logging/epoch_11_train_metrics.pth b/r0_no_ji/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5439ac3176039d7b87a841d56bedf66117d5dc0 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05506fbca16d2f9be7ac44e6932a73060f33ec6391bca106f5aa98279120e12a +size 1372 diff --git a/r0_no_ji/run/logging/epoch_11_val_metrics.pth b/r0_no_ji/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce56dc7f88054ddb57c40575b94347e9eaa5b468 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989f7d5f063df7405767b5ebe900868899808f30cd7e0485e008de9e3b2f966c +size 1172 diff --git a/r0_no_ji/run/logging/epoch_12_train_metrics.pth b/r0_no_ji/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..386a869e10cec96771584deaa37f062447513e23 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d612b0a72d415f09f1667c4cd1478a9730133cc8d56ff309e3476019cec79ed +size 1372 diff --git a/r0_no_ji/run/logging/epoch_12_val_metrics.pth b/r0_no_ji/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..845de92bf405a78143ebaa7b3ab4241badbcb3aa --- /dev/null +++ b/r0_no_ji/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6828ca6f919834d17ca141760a4f548b5a7f7e5fb2b085ebf719d622f4e466 +size 1172 diff --git a/r0_no_ji/run/logging/epoch_13_train_metrics.pth b/r0_no_ji/run/logging/epoch_13_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..56cb499d82b8321f2873f7f597e55522c4ccc834 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_13_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2a5a1c905f0e6876d6c200d6a35d2c1701b39fbea038e344f0287dba528430b +size 1372 diff --git a/r0_no_ji/run/logging/epoch_13_val_metrics.pth b/r0_no_ji/run/logging/epoch_13_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d91d97d2eec1dc9df289756895ffc796ca84d7b --- /dev/null +++ b/r0_no_ji/run/logging/epoch_13_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb47cc85a160012bcf6c6995ebb2c44012d2a09613f720ea749f11e1aa638430 +size 1172 diff --git a/r0_no_ji/run/logging/epoch_14_train_metrics.pth b/r0_no_ji/run/logging/epoch_14_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b4fd4a32192318aaad0d8b739cefc075a35b613c --- /dev/null +++ b/r0_no_ji/run/logging/epoch_14_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3991d41558369b53de69e2be77ccc4e23c8e5b774993eaf5ee980affbe29ad +size 1372 diff --git a/r0_no_ji/run/logging/epoch_14_val_metrics.pth b/r0_no_ji/run/logging/epoch_14_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1acedf2b05ac4512672e07f59f5d0dfd49d9c9c3 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_14_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a2631ec62c63720a59704fc3fa61c9afeb39bdb10167476cf148557e3194f8 +size 1172 diff --git a/r0_no_ji/run/logging/epoch_1_train_metrics.pth b/r0_no_ji/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0de9b7cdaee2f174aa50c7b3b58acc4b1294252d --- /dev/null +++ b/r0_no_ji/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b36009ac769e7163676a288130f07716ac916da113511c585c1b7dab1f2340 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_1_val_metrics.pth b/r0_no_ji/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3de44bc4666fb13678d305826ac065700043b138 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64012dc573dcd013a27184f53a2cd461f281b5c1eb4cfa0659a82fba82019fe +size 1168 diff --git a/r0_no_ji/run/logging/epoch_2_train_metrics.pth b/r0_no_ji/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..38a138a7d002fe937b4ac0e398f7be6fcdea3b43 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eabffc6ca68d2dc02cc65f1b526998339c9f883e11032cce0ab819372d4b0aa9 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_2_val_metrics.pth b/r0_no_ji/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8635c1ccad033d639a8eab6c19670f10ff854c7a --- /dev/null +++ b/r0_no_ji/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c43cae5657c37eb2a749a07042a1e3259e00462c5aa39b5b8dd123e158f09d6 +size 1168 diff --git a/r0_no_ji/run/logging/epoch_3_train_metrics.pth b/r0_no_ji/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6e197d93041b9df9801c108864dc04f0cbd547c --- /dev/null +++ b/r0_no_ji/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d3f7613387cbd103713eab8c87bcc3d80f82e858bf1e1b35d2716ce8eceabc +size 1304 diff --git a/r0_no_ji/run/logging/epoch_3_val_metrics.pth b/r0_no_ji/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5a2b26fa089f2b6ae1673b8bc5de8ecd98dd5c6 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f4305e44ae8c3d1eebcdaa47b1046899d69b41003e25f2a41867e5cb4c5c0b +size 1168 diff --git a/r0_no_ji/run/logging/epoch_4_train_metrics.pth b/r0_no_ji/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a56fd6afd3fff2c44732f22b64b1387938207ca --- /dev/null +++ b/r0_no_ji/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378ef1d03c14addebe66a5ed94b89995225aa1ef99847cfba1bd0eca8a64d074 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_4_val_metrics.pth b/r0_no_ji/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..944c3897d75958f5618d4d32864b331d737be737 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf376abc56a9baef4671871d83c8c0676b870c9e342ed9add5c48078d619fea +size 1168 diff --git a/r0_no_ji/run/logging/epoch_5_train_metrics.pth b/r0_no_ji/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f401d37acb38b2510d1180bbb0c69639288974f --- /dev/null +++ b/r0_no_ji/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea4354b3e0d018b2f65803127b3709155b23a92b1be2f2b81c11ff0be85d5aa +size 1304 diff --git a/r0_no_ji/run/logging/epoch_5_val_metrics.pth b/r0_no_ji/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..84cfb4a2d28258da45607698e707a53192a1c559 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc41b613d7bdb213386ded4e973f4b5bc7a4a46481aa1776944e8f9d0894830 +size 1168 diff --git a/r0_no_ji/run/logging/epoch_6_train_metrics.pth b/r0_no_ji/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ae7fe847a5c5fcf19f18a8a5728d90f08b03755 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8805857f52108d4a8d22ed311849223aa1cea3e911fb5a2af0e93a20938d4296 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_6_val_metrics.pth b/r0_no_ji/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2becaeae3aa8778b7c8394fbb8e9519ad2e5e2c9 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96134fc5c236af87c9be89c176e5bb8d6fc7d7c5e94bdba67e13cb14ee18a4e1 +size 1168 diff --git a/r0_no_ji/run/logging/epoch_7_train_metrics.pth b/r0_no_ji/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b52beece1df38b7c7f79bfa97dc37c60ea34f6b2 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a8b4144e7fc7f0a6b9990e0552abc2e63f416044b7a7b61070912a4622d1a9 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_7_val_metrics.pth b/r0_no_ji/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..347cac366ddc01906e797505dcc18f6d6fca52d0 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9808993fc7d1c18d084fc5359998174a29a6a7728f962aebf5d44372597e8443 +size 1168 diff --git a/r0_no_ji/run/logging/epoch_8_train_metrics.pth b/r0_no_ji/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3a8598d0033980e42129b7d8ee4a67862ff4587 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268df7c9b8085665cc8747bb064a2f126cb83b4f1674df69274391b25eb63e59 +size 1304 diff --git a/r0_no_ji/run/logging/epoch_8_val_metrics.pth b/r0_no_ji/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..13ad2b04af37ba0f9963d1491138126167f40139 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e5a20f11e210c4fb109d3d529938d4ebad014113ae5454b6b60995c5fec7aa +size 1168 diff --git a/r0_no_ji/run/logging/epoch_9_train_metrics.pth b/r0_no_ji/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..765e9ed62b3ffd901eee21d3effc71758c1a14d2 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bd2562af91b5af73536362ec9d016b6d91e6746c52cbbfabe440dcd7271584b +size 1304 diff --git a/r0_no_ji/run/logging/epoch_9_val_metrics.pth b/r0_no_ji/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b4e22b2607ee7e429ef00a7a09380521fb3add7 --- /dev/null +++ b/r0_no_ji/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49449a921d06f3d73e5e4caed79d77a191ecc8129b77ef9bb07f405021c4f82 +size 1168 diff --git a/r0_no_ji/run/logging/exp_cfg.yaml b/r0_no_ji/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..6b4188b1b4dabb0fa534a2838e036892aa5113a7 --- /dev/null +++ b/r0_no_ji/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run_i2_half_seed_run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run_i2_half_seed_run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run_i2_half_seed_run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 25 +model_family_name: no_ji +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: i2_half_seed_run +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: true +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 735553 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 1.0 +test_batch_size: 4 +top_k: 20 +top_p: 0.8 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r0_no_ji_half_seed_run +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r1_baseline/run/checkpoints/acc/README.md b/r1_baseline/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r1_baseline/run/checkpoints/acc/adapter_config.json b/r1_baseline/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r1_baseline/run/checkpoints/acc/adapter_model.safetensors b/r1_baseline/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1944b9bef69b97de4d3a6579fc8173062065356d --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac0dc7f01d0c07523f32c6180957835d6ce54f8cd6a53f95565d2d719283276 +size 45771496 diff --git a/r1_baseline/run/checkpoints/acc/best_optimizer.pt b/r1_baseline/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..95eec1cd6caa73d42f5f6f41389a1a1b216328e7 --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded6ebe15ae7c6f203c416dcc3511f75985ceac537dbc161d19841a6d3d7f125 +size 91855438 diff --git a/r1_baseline/run/checkpoints/acc/best_scheduler.pt b/r1_baseline/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b69fc03d50615dd51da173d69c732065e7e4068 --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a61a0c73485ea5e8430bc0649e93a840b8dc15b49cab83657e79841287212e +size 1084 diff --git a/r1_baseline/run/checkpoints/acc/saved_metrics.pth b/r1_baseline/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f125aa3ee5fc737b3d629ec64675ff88a5e0d53 --- /dev/null +++ b/r1_baseline/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b337d81720ecdcc1a2776059dd91d98277b9a8b96b6035a19142aedd297b868 +size 1016 diff --git a/r1_baseline/run/logging/epoch_0_train_metrics.pth b/r1_baseline/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5cbd76877bbb8d50339fc28e1f4c7fa0266761dd --- /dev/null +++ b/r1_baseline/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fdb88ddc11b40614502e816dd1628100112650b02948a26b08bea57b7d678f1 +size 1304 diff --git a/r1_baseline/run/logging/epoch_0_val_metrics.pth b/r1_baseline/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7646bcaf1b926e2466ab1a0ac946639d08213002 --- /dev/null +++ b/r1_baseline/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b544d8909226cb5d9e188488853d856b39cb58ddd0f8534022bed177c2ac3f32 +size 1168 diff --git a/r1_baseline/run/logging/epoch_10_train_metrics.pth b/r1_baseline/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb43241d1385914a468ac9b88209aa61752d19b2 --- /dev/null +++ b/r1_baseline/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33236201cb51fd485c2d8326161820aab7866083ac4018e9e19a052477021e79 +size 1372 diff --git a/r1_baseline/run/logging/epoch_10_val_metrics.pth b/r1_baseline/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..49fcab5d7c1f4ac372361d44aedbf93e77a34a7e --- /dev/null +++ b/r1_baseline/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61091cf8811ed3a2341efdc71e01d9118feda9b30fe206504534c07c52c26f26 +size 1172 diff --git a/r1_baseline/run/logging/epoch_11_train_metrics.pth b/r1_baseline/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1354ce0a845109824deb68fe2d20ef464e9bbc83 --- /dev/null +++ b/r1_baseline/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2796637c5bc14b5dc880431896a6476754177330f71ce2c69996526526ae0e3 +size 1372 diff --git a/r1_baseline/run/logging/epoch_11_val_metrics.pth b/r1_baseline/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e89a8779f9ff9ca39ebba6a07fb6ed8f8ab2213b --- /dev/null +++ b/r1_baseline/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc4a1c2abc134eed541a04506838d6cc60d8ebcf928bcf6b207561712478b3e +size 1172 diff --git a/r1_baseline/run/logging/epoch_12_train_metrics.pth b/r1_baseline/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6425097e13cf6f48e8f08e587d65e405ad161e6c --- /dev/null +++ b/r1_baseline/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8f0d669f0b1df86c95bcfb3f5b587d83cf671d1fd1c263453a3139a654dcde +size 1372 diff --git a/r1_baseline/run/logging/epoch_12_val_metrics.pth b/r1_baseline/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf7c1cf2adb9818ae47e905fea4e20f7651433d5 --- /dev/null +++ b/r1_baseline/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5084ade6f795d62623dd8c99fd9fcca7185a596fba13517ed6c37fdfb9f19f33 +size 1172 diff --git a/r1_baseline/run/logging/epoch_13_train_metrics.pth b/r1_baseline/run/logging/epoch_13_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..182294ec88e2c458b245df155d831291d44fb42e --- /dev/null +++ b/r1_baseline/run/logging/epoch_13_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e69b7c66387d88f0471e2fcb7520207ca85384f73e8b6be4989871ded25f3e +size 1372 diff --git a/r1_baseline/run/logging/epoch_13_val_metrics.pth b/r1_baseline/run/logging/epoch_13_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..bcaf054a1d996a6d4c564985430395d78058fcf9 --- /dev/null +++ b/r1_baseline/run/logging/epoch_13_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051d052d0daf106bb4cba4eecd45c6d5fed25ad13143b0ca15a6881e8ef7fab8 +size 1172 diff --git a/r1_baseline/run/logging/epoch_14_train_metrics.pth b/r1_baseline/run/logging/epoch_14_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7ce0117fc3cbeb7a56ddc05996d4520c9ef3182 --- /dev/null +++ b/r1_baseline/run/logging/epoch_14_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c71b3b4c4364ea67d5d457e1a54d0530ba8f62c4ceda6c448ce8508ddf6e1b +size 1372 diff --git a/r1_baseline/run/logging/epoch_14_val_metrics.pth b/r1_baseline/run/logging/epoch_14_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..71952fbe08a49946aff03703ae765c8043feae26 --- /dev/null +++ b/r1_baseline/run/logging/epoch_14_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37988ee709646a845b3f5a152997f14797415ff0a1f8effbc0ccd44abc6cc22f +size 1172 diff --git a/r1_baseline/run/logging/epoch_1_train_metrics.pth b/r1_baseline/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c3c1a6089bb114ef69cac945290273e5d1737da1 --- /dev/null +++ b/r1_baseline/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d43d1299f23fa930b901f8a551264dfad90fb3413fedba7a663fa0fdabfb261 +size 1304 diff --git a/r1_baseline/run/logging/epoch_1_val_metrics.pth b/r1_baseline/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c79735fa4edfa1e21e0f899aa8934a69d817c59e --- /dev/null +++ b/r1_baseline/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6014cb6b8408d0bfa4d10b19eb43c9221e2678b531e0d58ee205b234addcb38 +size 1168 diff --git a/r1_baseline/run/logging/epoch_2_train_metrics.pth b/r1_baseline/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3dd7078809a6c04030da494409297ae90ee56eed --- /dev/null +++ b/r1_baseline/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f0a5bc2b0f4a457fb6c3afce051d644e2d27fae0d9b6bb15afc01b3aa1737e +size 1304 diff --git a/r1_baseline/run/logging/epoch_2_val_metrics.pth b/r1_baseline/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea0eb36a6944f463d2ea963965382c9ca7f1fd73 --- /dev/null +++ b/r1_baseline/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1476f9ef63d015020961b171f3c523f144d362d0a9b6047f71110eb781af264 +size 1168 diff --git a/r1_baseline/run/logging/epoch_3_train_metrics.pth b/r1_baseline/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..78be2a11f70247bc64b92eee7887ef0cbe0d28b1 --- /dev/null +++ b/r1_baseline/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61bad71b45a594592ee8c9399ce1654841d63a9b2f7f1fe88c231b87fc1b2ada +size 1304 diff --git a/r1_baseline/run/logging/epoch_3_val_metrics.pth b/r1_baseline/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..49d25835745f1bba046da03b38283c6171c68c87 --- /dev/null +++ b/r1_baseline/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72aa43ac8e58efd44f07fd15cc2b4d9ebe70f0efa502027872024be04e40fdfe +size 1168 diff --git a/r1_baseline/run/logging/epoch_4_train_metrics.pth b/r1_baseline/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..011f0c276a3927d063a21ea27b1159a4119f8f38 --- /dev/null +++ b/r1_baseline/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b7620b17e995d5aa62b914f8ed675357c7d63361f7657953a6b984b69b9f8b +size 1304 diff --git a/r1_baseline/run/logging/epoch_4_val_metrics.pth b/r1_baseline/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..07fda10bc66ad09749edd41780b1143850570342 --- /dev/null +++ b/r1_baseline/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf3e1e410bd18a38601e819805799f9d127a0a79f550b5872d047cf6f5cd3af +size 1168 diff --git a/r1_baseline/run/logging/epoch_5_train_metrics.pth b/r1_baseline/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d5cb96b8adf643065d1d15514446dcba15e86c2 --- /dev/null +++ b/r1_baseline/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757b42dd22b21b3491a77e36b4668f4b7b586f0ba6e2471dccc6715eea5c34c7 +size 1304 diff --git a/r1_baseline/run/logging/epoch_5_val_metrics.pth b/r1_baseline/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..15419ff9d5b81636b2b33374d424bcf05860e23d --- /dev/null +++ b/r1_baseline/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48defb94cbce9405d45ec2de6cb3a6c1256cc9e97386327090ba6f9c1c8ae92 +size 1168 diff --git a/r1_baseline/run/logging/epoch_6_train_metrics.pth b/r1_baseline/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..49c8d040f589502ebbe8028450e66b88a9cb063e --- /dev/null +++ b/r1_baseline/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52202f672291c89df86229aac634faf7da60e5dd35bf5f66f2263c8c2025993 +size 1304 diff --git a/r1_baseline/run/logging/epoch_6_val_metrics.pth b/r1_baseline/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..79c15439692a87a6294e9b6d3a0ce4d206b95dd3 --- /dev/null +++ b/r1_baseline/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3911b25d8a3fc480bac28a075cbfc8baa4b549268a3f7dd6d359f54fcdd74a4d +size 1168 diff --git a/r1_baseline/run/logging/epoch_7_train_metrics.pth b/r1_baseline/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..07998adecb4b777a2fc2be056304f0f4e3a4af96 --- /dev/null +++ b/r1_baseline/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7d1875cd39c9091c7bc0d294d05c8b6193e96dcb64ae402c0513dc1a95208a +size 1304 diff --git a/r1_baseline/run/logging/epoch_7_val_metrics.pth b/r1_baseline/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5c9e487db9e6689c8ee42c70b749398879ad3bb7 --- /dev/null +++ b/r1_baseline/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1323f6cc3f89450b3b4e81e0e1d88f4cafa6154e6c408dd897bbfaa526026f46 +size 1168 diff --git a/r1_baseline/run/logging/epoch_8_train_metrics.pth b/r1_baseline/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..57598fe4d5fbeec047f208949e8e7cd7669c136c --- /dev/null +++ b/r1_baseline/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf84d8c1e9933946ce4977d1be3d16a8aa09d0696f83963adad18f2513ba28ba +size 1304 diff --git a/r1_baseline/run/logging/epoch_8_val_metrics.pth b/r1_baseline/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8478ea90bca978fd30956b2ff9af48e54570cc9d --- /dev/null +++ b/r1_baseline/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aadf7ac8b32b38a2baa5d9c56ed994687ab5210f42fd0766d530a330c7ba82c9 +size 1168 diff --git a/r1_baseline/run/logging/epoch_9_train_metrics.pth b/r1_baseline/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dcfd86d7498cbad3341d6c355b4f7e47044f778e --- /dev/null +++ b/r1_baseline/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff7255ac5e97db8d62f445016e244049cd689639ea7a09073047a0e90a6aa61 +size 1304 diff --git a/r1_baseline/run/logging/epoch_9_val_metrics.pth b/r1_baseline/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1db67c218292daeb062e259125799f0acfc121e1 --- /dev/null +++ b/r1_baseline/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888c5161e0ee2dcfd69ca0f8d611f4247802c3856e6a9205cf1b6f9f49f4c1a0 +size 1168 diff --git a/r1_baseline/run/logging/exp_cfg.yaml b/r1_baseline/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..1555bf2b4859331425d938b1e2f4b9b5e5c92140 --- /dev/null +++ b/r1_baseline/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_baseline/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_baseline/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_baseline/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: baseline +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 741624 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r1_baseline_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r1_full/run/checkpoints/acc/README.md b/r1_full/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r1_full/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r1_full/run/checkpoints/acc/adapter_config.json b/r1_full/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r1_full/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r1_full/run/checkpoints/acc/adapter_model.safetensors b/r1_full/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..571390829847e76f2c9e016cda69b1bc817b1c13 --- /dev/null +++ b/r1_full/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110cb576ae93ee177c90f1535763a06f37d0a8b032bc6e6976e59c2a7ae10fbd +size 45771496 diff --git a/r1_full/run/checkpoints/acc/best_optimizer.pt b/r1_full/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff5611e4f9ea99e65933ef7ba32b555f65944db --- /dev/null +++ b/r1_full/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867058dfecfd00d2393181b0e47188d9a32c3d32104bcb915cc4c63fb6446ae4 +size 91855438 diff --git a/r1_full/run/checkpoints/acc/best_scheduler.pt b/r1_full/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a88ab0cc3af41a7fff633aa2473544d35870db67 --- /dev/null +++ b/r1_full/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a827e17656bf2f0e1e3a04c7aa61390e4c5db85b16844c14ae72c65b73b7e54f +size 1084 diff --git a/r1_full/run/checkpoints/acc/saved_metrics.pth b/r1_full/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c13944724e26c0c6d5798cf569a5a8f6584fd8b --- /dev/null +++ b/r1_full/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dca83bb01ee0fa1c04371acda8dd43fff03c7f6e730a0a4b6739e7a81273dfc +size 1208 diff --git a/r1_full/run/logging/epoch_0_train_metrics.pth b/r1_full/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd2c7921c7bf9ef98a69b524e2c7d913b015d964 --- /dev/null +++ b/r1_full/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a379485e38cdc57f2002badb7af38cf479ffa1cd97a22b5a706b5648123fe31d +size 1304 diff --git a/r1_full/run/logging/epoch_0_val_metrics.pth b/r1_full/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0248ccb89a146ff820a2967d8737c77bd98ce059 --- /dev/null +++ b/r1_full/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec49b31e79ad71088230a8185e21c7005c42083ac5c1d262ed2b5ad5c0e18a9 +size 1360 diff --git a/r1_full/run/logging/epoch_10_train_metrics.pth b/r1_full/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8cdf7c41eb48d6fa13438a91d9463fb2eae5052 --- /dev/null +++ b/r1_full/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e347df4052c9cae458851d6b2568aa4a807a21e439f1da68b6e320447c94f35 +size 1372 diff --git a/r1_full/run/logging/epoch_10_val_metrics.pth b/r1_full/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d779894957d7b975266bc0c32d7402a0c5e77ef9 --- /dev/null +++ b/r1_full/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cbfd967ec772e9404b20e0686d7fcc5048361b89ee66a2be6cafd048f825dc +size 1364 diff --git a/r1_full/run/logging/epoch_1_train_metrics.pth b/r1_full/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..bde7f16affec7a25e0bbc29f2c885fb493758db1 --- /dev/null +++ b/r1_full/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539133848290b8e7fd3471eee20a25f2b650ef4679807825713a858c405d945f +size 1304 diff --git a/r1_full/run/logging/epoch_1_val_metrics.pth b/r1_full/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c54ec75d326b655209e801f51ffa9b460e314266 --- /dev/null +++ b/r1_full/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04942ee3d3a2eb8d06e9b1f7d8394b52dc958dbcff027f8f9d249ecdb132e54 +size 1360 diff --git a/r1_full/run/logging/epoch_2_train_metrics.pth b/r1_full/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..878504a1f5192f7f21bf4a25a56634a077599736 --- /dev/null +++ b/r1_full/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53a156751b435d20f91b1914c6a99f38247a502231b930c209b3e2b0cff9bf6c +size 1304 diff --git a/r1_full/run/logging/epoch_2_val_metrics.pth b/r1_full/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..91c6371e9a76562b4fab42eeccf43840da4878cd --- /dev/null +++ b/r1_full/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c79e0472b7f2ef2cf0a26b3960d6b69e21717e719d755dab397f7c98191a39 +size 1360 diff --git a/r1_full/run/logging/epoch_3_train_metrics.pth b/r1_full/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..33b8b480c3e1a64bc877bc549288ea57d7a0a6b0 --- /dev/null +++ b/r1_full/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0825992b8e9ce2e441d1fe12a5976afc69dffb6402b87e7f086eed0579acfb59 +size 1304 diff --git a/r1_full/run/logging/epoch_3_val_metrics.pth b/r1_full/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..283e59adf690fb853075a6baf14630d195d07d2e --- /dev/null +++ b/r1_full/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08cedb85513238799bf3a860ae27eee6ba82d698e352b474f4336cd7189f0ab +size 1360 diff --git a/r1_full/run/logging/epoch_4_train_metrics.pth b/r1_full/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3a523be9d450e641b4834bb688426c560b53c153 --- /dev/null +++ b/r1_full/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d58c525f5aa3bd4484960efa04c14677ccd4b54fe36e3d30da04602e9da163 +size 1304 diff --git a/r1_full/run/logging/epoch_4_val_metrics.pth b/r1_full/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a425f8601988f69a0c18f62429446245ce84f733 --- /dev/null +++ b/r1_full/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28963e36cf12cd62dfdb91913e7270a080ff5d5dead4da2906f9f02326075a48 +size 1360 diff --git a/r1_full/run/logging/epoch_5_train_metrics.pth b/r1_full/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fcdffc4f4c9aed99964c4aba8ccb8cb0353d708b --- /dev/null +++ b/r1_full/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb4bca43023e2b05cbfdc1af3af0dd2070cb3dddaff16746db533f7b509bcc3 +size 1304 diff --git a/r1_full/run/logging/epoch_5_val_metrics.pth b/r1_full/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5eff93fe0f6a9110ebe70f7e13b353eb9cad3e32 --- /dev/null +++ b/r1_full/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8109a6610ca1160326dd71d03ec25e3f2c419664cf0b428d6c451a5120ce51ec +size 1360 diff --git a/r1_full/run/logging/epoch_6_train_metrics.pth b/r1_full/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..38a40104e3859fe6178f050243b02a199340acb1 --- /dev/null +++ b/r1_full/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc444a83cf6128ccedf55bfa00b1ec6b9af615b2427264e0ca046947e634aae0 +size 1304 diff --git a/r1_full/run/logging/epoch_6_val_metrics.pth b/r1_full/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..929eed2877305c7528382f4085447c95a78bdafe --- /dev/null +++ b/r1_full/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ed2eb76a88b396f5cc23abf72881bb939a2e1393d5a3b01297ae3637df8541 +size 1360 diff --git a/r1_full/run/logging/epoch_7_train_metrics.pth b/r1_full/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..07e855102d91fc3b87fef7761097ab69ab3caa8c --- /dev/null +++ b/r1_full/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b1b852e29ef27084f13613d83e2368b7e66cee4ca9f6576364123f7b5d2b08 +size 1304 diff --git a/r1_full/run/logging/epoch_7_val_metrics.pth b/r1_full/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8a14a287d784c00f8491993be94254b01435997e --- /dev/null +++ b/r1_full/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bda27cc18f16961e02416ab59061a72cc21c5396896aeb0888cb69c83fab491 +size 1360 diff --git a/r1_full/run/logging/epoch_8_train_metrics.pth b/r1_full/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b909a6eb23061c329c23a6173db1c771c9582100 --- /dev/null +++ b/r1_full/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c09a7bfa88cc485bb0890c3cbc558681cc962403539b1d06e9bc846dae03fe +size 1304 diff --git a/r1_full/run/logging/epoch_8_val_metrics.pth b/r1_full/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ee61e8541b737ac8e1f19d3944ff3245e001449 --- /dev/null +++ b/r1_full/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4740257b044363a7905ab9364815dd4c53cc741acd584c2734b42e9a19344c00 +size 1360 diff --git a/r1_full/run/logging/epoch_9_train_metrics.pth b/r1_full/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5df1c9c2b982f74bf12c37791541343decfab89 --- /dev/null +++ b/r1_full/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acbb4206b0df204326f105e6c5a45459ebd4301af1f06f15d062117a4375de50 +size 1304 diff --git a/r1_full/run/logging/epoch_9_val_metrics.pth b/r1_full/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c760bc1499a1f54fa7c3b0982ead1c9aea567cc5 --- /dev/null +++ b/r1_full/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04808295e5ec7549a5b7fb98669fe9967390e9e4484b17cf14d500a6bb9d4781 +size 1360 diff --git a/r1_full/run/logging/exp_cfg.yaml b/r1_full/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..76107b1bc2d7b318572bc805d3ee82625460255e --- /dev/null +++ b/r1_full/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: full +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 699332 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r1_full_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r1_no_ds/run/checkpoints/acc/README.md b/r1_no_ds/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r1_no_ds/run/checkpoints/acc/adapter_config.json b/r1_no_ds/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r1_no_ds/run/checkpoints/acc/adapter_model.safetensors b/r1_no_ds/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..12e9dcd5e6081159d9d952099dea7282908f3bfe --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62c4ed3a666e9f203da59f1a63ee8308b47c0fed8e4bca3cb7edfbab8a2e7ce +size 45771496 diff --git a/r1_no_ds/run/checkpoints/acc/best_optimizer.pt b/r1_no_ds/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..b427d4b2fe26ba8dd4b4a0feaa8b960e277a6859 --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b985ce8af3a6a80856dca0141812e30cb9408f01aafe92c3b65036e095d7a321 +size 91855438 diff --git a/r1_no_ds/run/checkpoints/acc/best_scheduler.pt b/r1_no_ds/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0312a1b3387160ece1635dd2924f25070144a91 --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325f352c6c867cb69bfd2aaf1d3c334807d2aff4303704f3963ed1c31e774828 +size 1084 diff --git a/r1_no_ds/run/checkpoints/acc/saved_metrics.pth b/r1_no_ds/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a205a665017b960a659df76a4c3dd2fc0b4e47df --- /dev/null +++ b/r1_no_ds/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce3ce8446fc86786210fbd6e332ec937a3caa53e6ee977da99ae92a6e9817211 +size 1208 diff --git a/r1_no_ds/run/logging/epoch_0_train_metrics.pth b/r1_no_ds/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..43fd16199ece3e1463f14efc25b78823c6956a42 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31241e433f987187a40177c63ef3047999ceabbed6efbf1035241e6cafa9299b +size 1304 diff --git a/r1_no_ds/run/logging/epoch_0_val_metrics.pth b/r1_no_ds/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..df5cbdfde2f32dc2dca6426197c8590059a48d6a --- /dev/null +++ b/r1_no_ds/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180838c2eb1eea5ba7cc47ddbe5139845a2dd17f4262514bee14651ef7d5c037 +size 1360 diff --git a/r1_no_ds/run/logging/epoch_1_train_metrics.pth b/r1_no_ds/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5f173148d88390e0d70537279b974da2784286d --- /dev/null +++ b/r1_no_ds/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf158e3dd5a73220b0870433e37e6aceef729f94eb3be5fa1449fec64d28811 +size 1304 diff --git a/r1_no_ds/run/logging/epoch_1_val_metrics.pth b/r1_no_ds/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c8d6a40550dc832823bf80ef964a2307f4c3a665 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e61a67420e51e60f1fe4cd3b394d52b406368d2fdba7d7361c8d4ec9c6d204 +size 1360 diff --git a/r1_no_ds/run/logging/epoch_2_train_metrics.pth b/r1_no_ds/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c43c270f4469f57f976c6035f0db18532e739938 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72dc643b02526f0dedbf751cb228f384bd2daa78775ba6ba1742b3ddbae0ef97 +size 1304 diff --git a/r1_no_ds/run/logging/epoch_2_val_metrics.pth b/r1_no_ds/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..96f21f9fccc1cc49dc902cf06ecd93294566ef41 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeedbc3ace4729d0918f60b74cfa6f9ffda3c8cb308b63abea16e0ca8de4c6fe +size 1360 diff --git a/r1_no_ds/run/logging/epoch_3_train_metrics.pth b/r1_no_ds/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..180fac8ad873842b97a9abe5a4594c1965e9590e --- /dev/null +++ b/r1_no_ds/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b802ec6a1cdfa75eeb8725ee6cab5d2bce4a1b15036bf414c96cf62920b8c64c +size 1304 diff --git a/r1_no_ds/run/logging/epoch_3_val_metrics.pth b/r1_no_ds/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e8e4fda457d2efa0eaf87448127709ccec188773 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a992fff428d192da66ea578c798fc605c653cef8d6a8f1690560b773a8011696 +size 1360 diff --git a/r1_no_ds/run/logging/epoch_4_train_metrics.pth b/r1_no_ds/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e07c25cbe6c3e93c6a83909d37cbc463ca410fb4 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707b0da9594ef8f40186056ff5843958e63e7e7b9cb9533c538940be3353244a +size 1304 diff --git a/r1_no_ds/run/logging/epoch_4_val_metrics.pth b/r1_no_ds/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..334f1a33ab7c0ab9097517dc7a430debf532db0e --- /dev/null +++ b/r1_no_ds/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:301799e55186eb00c4ad4459464b61c46f4a7db823310d9a14324bc5a43ad668 +size 1360 diff --git a/r1_no_ds/run/logging/epoch_5_train_metrics.pth b/r1_no_ds/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..faf9398fa325d9c478c9e07fec718e4b880193f7 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77d711e790b206aa248e855d2f5d61e4f7d5b08ff1be71c9a9994df765018c8 +size 1304 diff --git a/r1_no_ds/run/logging/epoch_5_val_metrics.pth b/r1_no_ds/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8878aec75735c51bdda5237e898a42e05968edb --- /dev/null +++ b/r1_no_ds/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde3997962f2a71383ff42177600ab5c5110ba798b142277b754b653c9f4067c +size 1360 diff --git a/r1_no_ds/run/logging/epoch_6_train_metrics.pth b/r1_no_ds/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c452015387cc3bc968135cfd2d246b73e6da6b37 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e73081072f10bcb2b6c447e15cad3b7fff09cd30101d71bda861496f51d504 +size 1304 diff --git a/r1_no_ds/run/logging/epoch_6_val_metrics.pth b/r1_no_ds/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e166f084438a5e3716d8ef0d0e74f6036fa1ed8d --- /dev/null +++ b/r1_no_ds/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda2d531acd91863753ca68ab411396c336a9f8ca8e85317405a96bb742a873c +size 1360 diff --git a/r1_no_ds/run/logging/epoch_7_train_metrics.pth b/r1_no_ds/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..bab6e34439ef725a513f5a3167794a15d7194162 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d11f8413bd966eb6b1b3ccebb3fd68aad7920f258ad2e01454413c8ce5aaa31 +size 1304 diff --git a/r1_no_ds/run/logging/epoch_7_val_metrics.pth b/r1_no_ds/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..47b92fe8935203757fb7edda26c014796e75ea22 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5282ccd64ae920f12b4bd134c7fa43557dc64079a4b6ab4721ba6b8fa53201 +size 1360 diff --git a/r1_no_ds/run/logging/epoch_8_train_metrics.pth b/r1_no_ds/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3398ee3a039f65d7b9f6fca6f26d19f7f3ee213 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0955d9cb9eca408c0d3ee1098f1bcb0a8a800379d17f8d649401d3cc74b47ab +size 1304 diff --git a/r1_no_ds/run/logging/epoch_8_val_metrics.pth b/r1_no_ds/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f1d45f556165bbdefb3f4d6825fab98334ee7e1 --- /dev/null +++ b/r1_no_ds/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0b195ec30221a8c9681c6b327ecd72514bc4bed5334b119501701d94f8c0b6 +size 1360 diff --git a/r1_no_ds/run/logging/exp_cfg.yaml b/r1_no_ds/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..ede6a088c4fb8a26336d4a58c8a7f17cd9d4aae4 --- /dev/null +++ b/r1_no_ds/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ds/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ds/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ds/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ds +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_full/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 557460 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r1_no_ds_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r1_no_ji/run/checkpoints/acc/README.md b/r1_no_ji/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r1_no_ji/run/checkpoints/acc/adapter_config.json b/r1_no_ji/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r1_no_ji/run/checkpoints/acc/adapter_model.safetensors b/r1_no_ji/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5cc0f998398a966baeb9cd49a3ebb14467d73ca --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce673b64ca17118911ccf75f344972eaf8cc1c747b4b0743ba9fbb58ee829ed +size 45771496 diff --git a/r1_no_ji/run/checkpoints/acc/best_optimizer.pt b/r1_no_ji/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8c34bfc8bc2250c7c6c9efc502690e1d3c56dae --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3e4e992557ee5a534f8f8f31693f739f7e64bc8e25945283a8318180539b56 +size 91855438 diff --git a/r1_no_ji/run/checkpoints/acc/best_scheduler.pt b/r1_no_ji/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7137f7ba81c519e8812413a7593917002e01472 --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92310b3d48b04025b66f83f2f2ce76276ec669204e8e3e260f1bfddea2af19f0 +size 1084 diff --git a/r1_no_ji/run/checkpoints/acc/saved_metrics.pth b/r1_no_ji/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..104ba73a7ed1c19e0f5b0cf9aac9fb4212eea499 --- /dev/null +++ b/r1_no_ji/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02417b7b4c23e6b45f2d15cf68034b74de3e376cf8a28718f7ffe98b9edd0a0 +size 1016 diff --git a/r1_no_ji/run/logging/epoch_0_train_metrics.pth b/r1_no_ji/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..67e0358a462edc695f1033bbe7bdb3dc969882bc --- /dev/null +++ b/r1_no_ji/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b84bacd8bd6603e858bf1c290e6a007d858a72b8b1ec5dff7c701ea70a63dc +size 1304 diff --git a/r1_no_ji/run/logging/epoch_0_val_metrics.pth b/r1_no_ji/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..139bfe471fea068d70a733fe5d9e5687573dfd97 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:026ef074e3d4e1c5a37813c0cc27e8e4c0885e772d841b558eae81a3086e1b34 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_10_train_metrics.pth b/r1_no_ji/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cefb49aec22b0c3016728ba1ecc4fa716d40ad39 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c684164ce88e03fd5d1f44089db8a7094182691ffb1c52df14171c2dfb83a3b +size 1372 diff --git a/r1_no_ji/run/logging/epoch_10_val_metrics.pth b/r1_no_ji/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..69c7df686b8541d6348bd4f7d40f93c721613373 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7960625b9b4452b2a7078ecd442652e64428a98dc2a10ad10b7781b6c72750 +size 1172 diff --git a/r1_no_ji/run/logging/epoch_11_train_metrics.pth b/r1_no_ji/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..712e06ff111ea83efbf9f47ca8212c40b368f30f --- /dev/null +++ b/r1_no_ji/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59164de9db72995be73ff230cac39d9b16153369214b6082e21a37490fbe2586 +size 1372 diff --git a/r1_no_ji/run/logging/epoch_11_val_metrics.pth b/r1_no_ji/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2a0474083ff668e583d5b7b5536d1393bda452ed --- /dev/null +++ b/r1_no_ji/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb7f121c6da810a2dbd11a0b54b3a00aa7ea1f31708a6d5e966ed26189e8d25 +size 1172 diff --git a/r1_no_ji/run/logging/epoch_12_train_metrics.pth b/r1_no_ji/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0add698a81efd3d3b5701d8fa6bf58b98423c6e --- /dev/null +++ b/r1_no_ji/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27edea507ac46080d4a0138e852bef969586fff8c5e4d545a6f2491ff7bbb180 +size 1372 diff --git a/r1_no_ji/run/logging/epoch_12_val_metrics.pth b/r1_no_ji/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..407938e09f3c06aeef49f1e9a34f5f976a3aa093 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b53b90993c76d5586670e41a372ccca79d227a5c5cd1b4bd38c0047a53468b4 +size 1172 diff --git a/r1_no_ji/run/logging/epoch_13_train_metrics.pth b/r1_no_ji/run/logging/epoch_13_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d31fadc1cdaca60830f84bc26cfb68cfa2f1b43 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_13_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5b7d8fadba4d2856ee705e6e1e9947bdc95113a26985c67a94df14f9d39370 +size 1372 diff --git a/r1_no_ji/run/logging/epoch_13_val_metrics.pth b/r1_no_ji/run/logging/epoch_13_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..71c0e2266482a76c8621e17c0c6391f384e17b13 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_13_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73e9aef3bc5c59087bdc2bb8386a3bbde2d7ff3cb07d1d6b0ba9fbcd3e205a41 +size 1172 diff --git a/r1_no_ji/run/logging/epoch_14_train_metrics.pth b/r1_no_ji/run/logging/epoch_14_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..721e354df5b22e8f3a5b793b1ae7be4426c55987 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_14_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b546d7ec1a5e8a9be2bfac4ee0e0f65c21219635ead818eca30e2037d146e7a +size 1372 diff --git a/r1_no_ji/run/logging/epoch_14_val_metrics.pth b/r1_no_ji/run/logging/epoch_14_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..446819d33819d165d81f5c501464b1d78f5f3760 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_14_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49207afce01d25fe6ce1ec8faf6d21a159eb0016e3b17035f63e48d602ff825 +size 1172 diff --git a/r1_no_ji/run/logging/epoch_1_train_metrics.pth b/r1_no_ji/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e88541531bf686326e1575e8d476b34aa420b7b --- /dev/null +++ b/r1_no_ji/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c4140209c10bd9e770cba8901e058c66aad1e82d16c692f8bd907207a80d21 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_1_val_metrics.pth b/r1_no_ji/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8367600845293f012e62c72dd6e4ca048f9b2180 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304a8538866862da677b31ced7cab0c0f65a3c7eb7344e59b00e06c594f9af11 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_2_train_metrics.pth b/r1_no_ji/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab75aea5d4871ce4ba18875521a55d9193c5ba06 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e048a269dae12fe0fd7e73aa6ad98292defef7805087b7a6c899809f13ad324b +size 1304 diff --git a/r1_no_ji/run/logging/epoch_2_val_metrics.pth b/r1_no_ji/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..62e1e56893f1b6b6f222e0068b0d8986068b49a4 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a4644e566c1389b3f26df11f82ec04df5775d49695bd80be3bb257f0d05af7 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_3_train_metrics.pth b/r1_no_ji/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..19b639dc0c9d32b04a680369229a5ae3d509a92f --- /dev/null +++ b/r1_no_ji/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c8d9f9d45cfcb9b4c0289230985f24e5dd6b30dcc88a41fd7ccc85931826ea +size 1304 diff --git a/r1_no_ji/run/logging/epoch_3_val_metrics.pth b/r1_no_ji/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1cc2c2dbf9e96e2927247819de9361f6aabb133c --- /dev/null +++ b/r1_no_ji/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d32970e65c2178dcbf4e323671334d660ffc53209529aa2375ef4efcb7a1a4 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_4_train_metrics.pth b/r1_no_ji/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a85e51b1086b899fb4e87e656e1da12096b3d614 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:260a9c2b7f7cc0e2c75bdcb7bbcc958db105a7de42dd7da9dc3d77c9cc9c7d77 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_4_val_metrics.pth b/r1_no_ji/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7417aba8df0a44a6e190f008b6ce9aa23c1157c --- /dev/null +++ b/r1_no_ji/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78279ea9846c7d6bf07b29ccece297028071a59795048e85f911293ac954ee7 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_5_train_metrics.pth b/r1_no_ji/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a2b6247fb701d19d4cfa21b7a314e7cc135ff901 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671e7f9f5417628e37fb4a11486c90c7779a0dd1dd10bbb7fdb25be4fb9cc89c +size 1304 diff --git a/r1_no_ji/run/logging/epoch_5_val_metrics.pth b/r1_no_ji/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f764c72cc915c71407215d43e21e6794b322d3b --- /dev/null +++ b/r1_no_ji/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d4aa1d55a7bf98a17e5964d90be670e354f2511943575f967f936282ebc7dd +size 1168 diff --git a/r1_no_ji/run/logging/epoch_6_train_metrics.pth b/r1_no_ji/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..665e41ad61e7185fbb9e82e2da7ad1d4516cf350 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2bd32de7aa66db8fb22eb0c223ab2c49e288e0e521fddf43e82ea855f8aea9 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_6_val_metrics.pth b/r1_no_ji/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..111a7d00a50af37b3b5d21804f50776ea16109ef --- /dev/null +++ b/r1_no_ji/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ba4d2db42106690f1b59af0ef6c700c53866ca2d61e835b0d7b357a271c81c +size 1168 diff --git a/r1_no_ji/run/logging/epoch_7_train_metrics.pth b/r1_no_ji/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..841151dd7909c53725392d58927c6be3f9e6aec5 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ce9d800a1ddf275490f4c694ed711456c52081c6438c5c16ed585f59e88006 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_7_val_metrics.pth b/r1_no_ji/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dcd03611ae4643499ca7030915d5ad0bfafc95c3 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e463bf3d2a6423348873ea8ed1317815eb1ee6a820c634de4bc32e7a33f6b09 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_8_train_metrics.pth b/r1_no_ji/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..940f30cbc83a4099c2df40bcf33c2b9b3bddc82a --- /dev/null +++ b/r1_no_ji/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f374c4285f23edbab4c3662296847776575edf55bc002a5d4c000049e1ef688 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_8_val_metrics.pth b/r1_no_ji/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e5eb859dd721fa47f9f80b0cb672a9331c249612 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378d1acdbf53535f4a7e86ebe76b4c68c9d2a9e934d93c492611b58235be31e8 +size 1168 diff --git a/r1_no_ji/run/logging/epoch_9_train_metrics.pth b/r1_no_ji/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5df9e8647cab9aeed5a3f85997ced814f0487b1 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6cadb83b6345f5c03d57e8ba32b838a594fb941cb632ed22b19c7d830c57011 +size 1304 diff --git a/r1_no_ji/run/logging/epoch_9_val_metrics.pth b/r1_no_ji/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab1cabffb7703e89efdf1f6adbbb77d37dc5cd98 --- /dev/null +++ b/r1_no_ji/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6f924755ed127ef701a2c03b48bc5ca1ec178307b7a5a0208a744e0ea3f82c +size 1168 diff --git a/r1_no_ji/run/logging/exp_cfg.yaml b/r1_no_ji/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..7e2d55f8283f125e584d5245aa22c98b1e8cf0c6 --- /dev/null +++ b/r1_no_ji/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 1 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ji +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r0_no_ji/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 505263 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r1_no_ji_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r2_baseline/run/checkpoints/acc/README.md b/r2_baseline/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r2_baseline/run/checkpoints/acc/adapter_config.json b/r2_baseline/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r2_baseline/run/checkpoints/acc/adapter_model.safetensors b/r2_baseline/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a73ab5c9ee68772e75d2b1fb43a2749eb1274516 --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a06e6c82943a7c41f90a02e216dae69bcad36a2ab13188e54dee2320d1d5c54 +size 45771496 diff --git a/r2_baseline/run/checkpoints/acc/best_optimizer.pt b/r2_baseline/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c954135d25a555479daa687afb427218ed820b92 --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88710afdeb931a570a08949e7c3117811ed84d53940354e95dc54f2f94659082 +size 91855438 diff --git a/r2_baseline/run/checkpoints/acc/best_scheduler.pt b/r2_baseline/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6809c6db1c116dcd801e932f4b581ed00b7c169d --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce855d36d4caa363c8d0677a25bc01fd104e14a24ac9d8b82298a7abe6c789b +size 1084 diff --git a/r2_baseline/run/checkpoints/acc/saved_metrics.pth b/r2_baseline/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3405ea92e438a7923f9121c428ad4e049b673c1 --- /dev/null +++ b/r2_baseline/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2338bc5e4ce64500847344f13aec00ba2da784b31af57a7cf8e087c63f57c97 +size 1016 diff --git a/r2_baseline/run/logging/epoch_0_train_metrics.pth b/r2_baseline/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..71f440de49321fd3944ebeefb14dc1afc844c762 --- /dev/null +++ b/r2_baseline/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21e89e3604228925de979f9db5f6d8631d4d8e826431744a85fef84a2c8f8f3 +size 1304 diff --git a/r2_baseline/run/logging/epoch_0_val_metrics.pth b/r2_baseline/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6bb00fd29d2421b14b134a4210d4e13d007ffe5f --- /dev/null +++ b/r2_baseline/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8154c9d7c9a8d8132efb53e3483ea858bb4a153ce791b84f5eae935dfba377ac +size 1168 diff --git a/r2_baseline/run/logging/epoch_1_train_metrics.pth b/r2_baseline/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b2735106a2cdd4f326d9d3a34aad40b1c2164a6 --- /dev/null +++ b/r2_baseline/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a7d69bb388dabd528594b78f82221849fe0270ead8be2e4936ea9ae5ba2cf7 +size 1304 diff --git a/r2_baseline/run/logging/epoch_1_val_metrics.pth b/r2_baseline/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2836ce325239a7bae78aad006c75b26fb80639ed --- /dev/null +++ b/r2_baseline/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a203cf97435c081ee1e6b443cef9fb6bec4fe72ee66384bbab6150359b3889 +size 1168 diff --git a/r2_baseline/run/logging/epoch_2_train_metrics.pth b/r2_baseline/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dbd47760dc6cdcdbdb45fb0aa2d9a813ed203ad9 --- /dev/null +++ b/r2_baseline/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5aa2db24548592856926b49e86ab620962ee006343446d98e278fffed5fdec +size 1304 diff --git a/r2_baseline/run/logging/epoch_2_val_metrics.pth b/r2_baseline/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..706122bbfda09af16835377b9025b358940e31dd --- /dev/null +++ b/r2_baseline/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1701a68c6e714cc49329a41c3b5145c80537a4a6b3b6859f9c9668f639c26a +size 1168 diff --git a/r2_baseline/run/logging/epoch_3_train_metrics.pth b/r2_baseline/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..68375db194d112757b4db05b2f37be8d9b7432ac --- /dev/null +++ b/r2_baseline/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e0606ae2487bd70358dd601b1e764720ffa9f1033710f9c1c30b06d928bad9 +size 1304 diff --git a/r2_baseline/run/logging/epoch_3_val_metrics.pth b/r2_baseline/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbbd35fbe5141e1d263dfc08b67e3d1ae36fa061 --- /dev/null +++ b/r2_baseline/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad520e7eca8ec44481877c1b2cb063ff570706440d210c32b08231984476de3 +size 1168 diff --git a/r2_baseline/run/logging/epoch_4_train_metrics.pth b/r2_baseline/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebf5f51ce901f34bc6542d63ebf6323827f58ae3 --- /dev/null +++ b/r2_baseline/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9ef1c2fe50a270d671a33d7f4a6002967e6283ede6d5ac30459bbcdac1d4a8 +size 1304 diff --git a/r2_baseline/run/logging/epoch_4_val_metrics.pth b/r2_baseline/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd5bf18f90f9c63ddea5eb6243e62dc62b2685e8 --- /dev/null +++ b/r2_baseline/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b773f70c45863453d40a0140c72aab04193ee61a9576e44ef1b6cc99a30d2881 +size 1168 diff --git a/r2_baseline/run/logging/epoch_5_train_metrics.pth b/r2_baseline/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2324264105d8794a80dff1b003ef5bb010362b6a --- /dev/null +++ b/r2_baseline/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbce0412e4e3b75068d7313dc83937a52ae90f19a9f25495e4e13eef640b0fc9 +size 1304 diff --git a/r2_baseline/run/logging/epoch_5_val_metrics.pth b/r2_baseline/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..21f90b810794bfecfce7ae1cf536fa62d2d72f42 --- /dev/null +++ b/r2_baseline/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ee5bde1ff94e04eaca4cfaa2fa3a9762662c60a503833ad78a8092f2c37122 +size 1168 diff --git a/r2_baseline/run/logging/epoch_6_train_metrics.pth b/r2_baseline/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..60806b1329ee737b84c94b9ed82013801c50195b --- /dev/null +++ b/r2_baseline/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69af83569ef3d40d739810a540586d3bc4b54178c52151176cfa115fb4d6eee0 +size 1304 diff --git a/r2_baseline/run/logging/epoch_6_val_metrics.pth b/r2_baseline/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..106a3c896037201cc12d2f6ad6b96f32d884eb55 --- /dev/null +++ b/r2_baseline/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84bfd1c5a8994dd170046591b0b9a2617f4536ed4eb0b7b8639d1c5fee4f06e0 +size 1168 diff --git a/r2_baseline/run/logging/epoch_7_train_metrics.pth b/r2_baseline/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a711157677941f82a5d981f2ece5692d839b638a --- /dev/null +++ b/r2_baseline/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292df89a2a7546cc2e43ba6ad017d4046bd7fc6f9e4e60a4b8b46b99177e8dfe +size 1304 diff --git a/r2_baseline/run/logging/epoch_7_val_metrics.pth b/r2_baseline/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..13707ee870c72fa8beae8d6174bba5bed40c2841 --- /dev/null +++ b/r2_baseline/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5cfa72c5c8d5945bf171d65afd2c9e4d1a81392847a1931e1229f249fce88a +size 1168 diff --git a/r2_baseline/run/logging/epoch_8_train_metrics.pth b/r2_baseline/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a5957a9bad7de9842e117989a3ed510f132ab35 --- /dev/null +++ b/r2_baseline/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f87bf94a73aedb542966efc06f88aa3412a2f3dca532bdeb3c9f396177ebd26 +size 1304 diff --git a/r2_baseline/run/logging/epoch_8_val_metrics.pth b/r2_baseline/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..67a936a05c11f4b6d6c5524fa9bc5edea395f304 --- /dev/null +++ b/r2_baseline/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac2f033b55b0bc03da26e976a56a5d2d3ff7392fd19181b360a5ec6e0888db7 +size 1168 diff --git a/r2_baseline/run/logging/epoch_9_train_metrics.pth b/r2_baseline/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0244ffc11239bf4a35119d94104214bd330e80cf --- /dev/null +++ b/r2_baseline/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf8df51cba91457b0a5627767d5f7883f0b70c1925959b73f3265959671b014 +size 1304 diff --git a/r2_baseline/run/logging/epoch_9_val_metrics.pth b/r2_baseline/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9d584fba0ab733e1e3cfe59ea85029b1f73b273 --- /dev/null +++ b/r2_baseline/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f63e71b651f15ff1fae0b74b008cd9a7d2a45819038d3633282d704f40b003a +size 1168 diff --git a/r2_baseline/run/logging/exp_cfg.yaml b/r2_baseline/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..864a1558659378f9c7ee390265a9d4f3f8540c3a --- /dev/null +++ b/r2_baseline/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 2 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: baseline +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_baseline/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_baseline/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 226422 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r2_baseline_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r2_full/run/checkpoints/acc/README.md b/r2_full/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r2_full/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r2_full/run/checkpoints/acc/adapter_config.json b/r2_full/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r2_full/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r2_full/run/checkpoints/acc/adapter_model.safetensors b/r2_full/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9d37cf5297adc38008d72f1a877161a53d120c8 --- /dev/null +++ b/r2_full/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbd8c24f95ec1b57cd9950254d599b822bbdc7882e91a461e2cd9f523b186a9 +size 45771496 diff --git a/r2_full/run/checkpoints/acc/best_optimizer.pt b/r2_full/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb1ba38807c83710605bf14cf9cd347fac790b3 --- /dev/null +++ b/r2_full/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8bd63ee6c31fd0b50fa9e5c77d2d44dd37d00eae9c26c49755dc02494f76ff +size 91855438 diff --git a/r2_full/run/checkpoints/acc/best_scheduler.pt b/r2_full/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c275c9fa90c469fe5f5966eb740bd35d9dbe5e1d --- /dev/null +++ b/r2_full/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947762d2b3dbe7a558a0489da6ebe1ead77a94d9dadf05ca50707946798d9d7f +size 1084 diff --git a/r2_full/run/checkpoints/acc/saved_metrics.pth b/r2_full/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2a8570908bd253531edb026960d77b36ca96231 --- /dev/null +++ b/r2_full/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38c6b7622d805e2691bac1d186660df9f52db4910d1bd922f1281541053f9ef +size 1208 diff --git a/r2_full/run/logging/epoch_0_train_metrics.pth b/r2_full/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0c65f568c485b257ae0f37eb725824ae7224aa5 --- /dev/null +++ b/r2_full/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde03a9023577ea7a0de863e6d4f76ef328b690cf316c3a3aa631b281ccaf5bd +size 1304 diff --git a/r2_full/run/logging/epoch_0_val_metrics.pth b/r2_full/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8232ec54b3dca03d6cfb9ec94de3b731d2a72c8f --- /dev/null +++ b/r2_full/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a446dfb0be023b8302e6903a2b9a4233d5fec632a1a371b0bff3c34146e3df7a +size 1360 diff --git a/r2_full/run/logging/epoch_10_train_metrics.pth b/r2_full/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c440a555ff34615b9b233b2958030e580674b5bb --- /dev/null +++ b/r2_full/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55a8bc0075b648b38c4e82d3fe3684d137e391a72a56003dcdd5ff1ad3fccab +size 1372 diff --git a/r2_full/run/logging/epoch_10_val_metrics.pth b/r2_full/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6db739f37e9f425799ab28cedf1b2edd8c6d7752 --- /dev/null +++ b/r2_full/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:856ff2b76632c91dd9441e7efbea00f68128f02846d5ba141319e57d0aea1bec +size 1364 diff --git a/r2_full/run/logging/epoch_11_train_metrics.pth b/r2_full/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..28adbabebc617c90f0231cfbe03a378e77feef3d --- /dev/null +++ b/r2_full/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2da86d6010219f99a2ed0e06e202fa67c961a7dd7210f86a90401093cfd6583 +size 1372 diff --git a/r2_full/run/logging/epoch_11_val_metrics.pth b/r2_full/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..45ae4d9b6aa97d8fb23b6c547b4734e38be9efec --- /dev/null +++ b/r2_full/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491e979a3a225861fbd6c0857b8a7d61b1e36ddf60c7c087e6be0e7649b7598c +size 1364 diff --git a/r2_full/run/logging/epoch_1_train_metrics.pth b/r2_full/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..51370706eb14376771f633a336ddacb562b9dbb6 --- /dev/null +++ b/r2_full/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f89725689d860032d3f9bb4e2c26facef54cf1d0066b07aef52aee41202328c +size 1304 diff --git a/r2_full/run/logging/epoch_1_val_metrics.pth b/r2_full/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2aa09a275466041cb983523afce4081d8201ff13 --- /dev/null +++ b/r2_full/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0dfe7a87b773b13e911b8df35fc3ea3c386b7ed018bc9d509704ef89bf0c443 +size 1360 diff --git a/r2_full/run/logging/epoch_2_train_metrics.pth b/r2_full/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..82b39a189236d0c26c2a6db64fdca9f451ef2414 --- /dev/null +++ b/r2_full/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d84b37beb54993d7d23223a008e2767ae08735ca3cb9ab1471d4d36059e6e17 +size 1304 diff --git a/r2_full/run/logging/epoch_2_val_metrics.pth b/r2_full/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6509618bac7e219bfe2d2c19af2a23ee8080815c --- /dev/null +++ b/r2_full/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8831aa90bf0aa9f42ffe1a2c762625e1749d9755326df705e30a09e6da60d +size 1360 diff --git a/r2_full/run/logging/epoch_3_train_metrics.pth b/r2_full/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..383bf0ed9f4bda9e5af3fa696e5d1d9e5b1b2c0f --- /dev/null +++ b/r2_full/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b32b8b60d0d173b4fb5eb438320a13ca1f1e6dbc287d00df06b8a3e3ef5a241 +size 1304 diff --git a/r2_full/run/logging/epoch_3_val_metrics.pth b/r2_full/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd28c540e5ebc67763d6b6ac4903cddba73e82be --- /dev/null +++ b/r2_full/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c071e4cc3374695de735c5fd50db635ea7c1741dc4bbf28af9af29bfba0a53ba +size 1360 diff --git a/r2_full/run/logging/epoch_4_train_metrics.pth b/r2_full/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f61a2d5f31e66f4efc46d8b35548a3ed5e4b8f5f --- /dev/null +++ b/r2_full/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7a7c4f41c13fce64e22a27d788cfec1bb8ca369f4145fdec0c65bc3bff04ab +size 1304 diff --git a/r2_full/run/logging/epoch_4_val_metrics.pth b/r2_full/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9638341e0a44d04e93990c87bbb05091ddf0f73 --- /dev/null +++ b/r2_full/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590a2132b377b84fc294993bf5f1d571527c9c6eaf9c3d5d1595b3c286573196 +size 1360 diff --git a/r2_full/run/logging/epoch_5_train_metrics.pth b/r2_full/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..07eaffd537c9ca2973d0f4140781f1191fa2203c --- /dev/null +++ b/r2_full/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b75a017cc25dc1e64b8702d283aeefa290be03e99464daf730d52fbd7106a2 +size 1304 diff --git a/r2_full/run/logging/epoch_5_val_metrics.pth b/r2_full/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fdf3dab11722ff6588473476700b7f09307508f2 --- /dev/null +++ b/r2_full/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1850e8f60792e26820a56543989581b206b45b24ff9a731f6b02d72920611e3e +size 1360 diff --git a/r2_full/run/logging/epoch_6_train_metrics.pth b/r2_full/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b95f640bf044ef38069f630b32376cf038c69f4 --- /dev/null +++ b/r2_full/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96ef0e8ef3a89faaecb9948af54b8d026d1ed55ffae1142b4d5a53044c4f4ac8 +size 1304 diff --git a/r2_full/run/logging/epoch_6_val_metrics.pth b/r2_full/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..32d5e55b21c4ac8bf9923d4bd449d36049a33432 --- /dev/null +++ b/r2_full/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de7dd33f1f409ffc61b0a259fd311df1163d570b12aa3afdaacb45d035f2abdb +size 1360 diff --git a/r2_full/run/logging/epoch_7_train_metrics.pth b/r2_full/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fc4e029295eee92fe37baf23d4645651ffd0ce7c --- /dev/null +++ b/r2_full/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0f654951fc2f9bd31e14a8ed05e387f9f4d9089502d9751c482613808b6c6d +size 1304 diff --git a/r2_full/run/logging/epoch_7_val_metrics.pth b/r2_full/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e2dee55814aada04d5a221edcae3794f7df456d6 --- /dev/null +++ b/r2_full/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7724f108a583a158d5e5cd50ca82fd4c3343d887f3c51f5a53d1bebd308e7f +size 1360 diff --git a/r2_full/run/logging/epoch_8_train_metrics.pth b/r2_full/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d65c05dc673a95150dbdbf67c1c4e16b1022a77 --- /dev/null +++ b/r2_full/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195fd3ea68c74e0506bd9a302ddc535ef1dc4c67947c913ef7e163f16e7d2999 +size 1304 diff --git a/r2_full/run/logging/epoch_8_val_metrics.pth b/r2_full/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f8baae90cbdb573bac84c8c83bfed7ce10a027d6 --- /dev/null +++ b/r2_full/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003212556664587dd15feaa155d3ea511d6f3365c22b82a39186d109c4bbe28a +size 1360 diff --git a/r2_full/run/logging/epoch_9_train_metrics.pth b/r2_full/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..47756de26f417e030aa1fa3a364251ce9e452dc0 --- /dev/null +++ b/r2_full/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0d5ca15ac62f2248c687c13ea569794a7eff4b99b64af10e68a3ba3820884f +size 1304 diff --git a/r2_full/run/logging/epoch_9_val_metrics.pth b/r2_full/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c55bb545e9b9452c5bd2fa8fea735b9d39c9f8b --- /dev/null +++ b/r2_full/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2931e7fcc8310acdca10434f25b0c9b9c97a97a5d483e20ca9814ea908828f09 +size 1360 diff --git a/r2_full/run/logging/exp_cfg.yaml b/r2_full/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..8951edad6142730c2007e5c1ce573b5f8fe60261 --- /dev/null +++ b/r2_full/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_full/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 2 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_full/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_full/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: full +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_full/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 543543 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r2_full_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r2_no_ds/run/checkpoints/acc/README.md b/r2_no_ds/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r2_no_ds/run/checkpoints/acc/adapter_config.json b/r2_no_ds/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r2_no_ds/run/checkpoints/acc/adapter_model.safetensors b/r2_no_ds/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32bdc6f9ea35cc34616ab6394d253991d43c4488 --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084719aa2e9f5bc363031be23fdbf54454ddf6bcd40225a64679fe06e09eca96 +size 45771496 diff --git a/r2_no_ds/run/checkpoints/acc/best_optimizer.pt b/r2_no_ds/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..13547744295896729a1094105b1a7bfe8407d90a --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6737e03d1cc233bef930b2e5896112bc7250278e39363806551024d9fb03662e +size 91855438 diff --git a/r2_no_ds/run/checkpoints/acc/best_scheduler.pt b/r2_no_ds/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b83c4d40b5e9a89309420a7b466d23d02a50e54e --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f357ebc85f447bece42877f32b48679cfa22029216cce5f01288bc8a1ac4aeaf +size 1084 diff --git a/r2_no_ds/run/checkpoints/acc/saved_metrics.pth b/r2_no_ds/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ac8efd8f03a6bebc090567674d9306e0f951c08 --- /dev/null +++ b/r2_no_ds/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5488399888d08d5ffb394c533d13964f3cc7a523deeaa4d28186fd15309803a +size 1208 diff --git a/r2_no_ds/run/logging/epoch_0_train_metrics.pth b/r2_no_ds/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6dcd4b66e3ae3c1c4233e908b36474546f1338f0 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb150ce3ff16092bb00868c5fa9288b00e7bc8dd1b71e226aa184ca1ce9f348 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_0_val_metrics.pth b/r2_no_ds/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7b42fdf37c3b620b4289f186b0e7e983bac4eaf --- /dev/null +++ b/r2_no_ds/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ebe26c109977ceb5f327b7d6258834ba13008ae536bdf53718d248fda4dab9 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_10_train_metrics.pth b/r2_no_ds/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d8e1b8220831dc226d81ec1cf560648c7595d3e7 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a839a837a1918aaa32074089963183408ac986c3c42e86ca55a2f4c25a9e11d +size 1372 diff --git a/r2_no_ds/run/logging/epoch_10_val_metrics.pth b/r2_no_ds/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..de295586a206acd9a3e5ce106072676c75cecfb1 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49cd0e5fff82481f6a461af86ae1c8b48df30ec942e6d1d362907d5f3fe67426 +size 1364 diff --git a/r2_no_ds/run/logging/epoch_11_train_metrics.pth b/r2_no_ds/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cbc198622f1c71cc787123263ffd2c21b17a02c0 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430b44fe34e6f28cf5c80695ddceb93d3f7f91d837d7027024c9f34b5c65d8e3 +size 1372 diff --git a/r2_no_ds/run/logging/epoch_11_val_metrics.pth b/r2_no_ds/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c57b35b4cca15836ca6a3c2ac0de75c425451bea --- /dev/null +++ b/r2_no_ds/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de00f887f217022b037aa513f22abfc91949284eafc62d7ceee3f9314ccfee0 +size 1364 diff --git a/r2_no_ds/run/logging/epoch_12_train_metrics.pth b/r2_no_ds/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbf737ef004d7894b51ea9f5a6df97c201821288 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9550d058ebbafca210926c0aeb70776d85eabfeda1b3a9e2c206517e1745cac6 +size 1372 diff --git a/r2_no_ds/run/logging/epoch_12_val_metrics.pth b/r2_no_ds/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce0b3e4e405cd1e4453d26b5962e46d298088c5e --- /dev/null +++ b/r2_no_ds/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddb82795dbc9c81041ed6cba7f89f7b09c4f790bc26a7fec2776fdf76238097 +size 1364 diff --git a/r2_no_ds/run/logging/epoch_1_train_metrics.pth b/r2_no_ds/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc207317c0b634d014a667d5ed1198d1e428b490 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3052f288a2fc5ff958f35050a2c60eb203307d896827452764e0641b71892d09 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_1_val_metrics.pth b/r2_no_ds/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..000c50c174b02bcdfc26fbbfdd3419926211aad4 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1ac53e7fee8c60e8b81e42026409d2b0da81fa9e124313fb727affa4536781 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_2_train_metrics.pth b/r2_no_ds/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2469943966c646cb4f30158c1e6857d8b681045b --- /dev/null +++ b/r2_no_ds/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554625fc8bcb044f6dc7f8592bf6a9817627fea8407bc3073272d81884a4dc01 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_2_val_metrics.pth b/r2_no_ds/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..84c7ab2a2829a3948c69c906fe5fa89f6a6ba27b --- /dev/null +++ b/r2_no_ds/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8800da7b9ad6e626fcb896cc19876a10997fa8a42850e710338496e1869a6d +size 1360 diff --git a/r2_no_ds/run/logging/epoch_3_train_metrics.pth b/r2_no_ds/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..121dc67806b6e8af3c6b4071676d614495ab117c --- /dev/null +++ b/r2_no_ds/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062771068cabf3d1d90393cac96c9942126ff5e45a640ee793f09e9ef6f17070 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_3_val_metrics.pth b/r2_no_ds/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..83e75b7ecdb6bb115543a5fd3b0e769199c1a32f --- /dev/null +++ b/r2_no_ds/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd55930b10f0c7a6eef518f36ff250db24c6d65f021dff7f7b69065d980bf406 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_4_train_metrics.pth b/r2_no_ds/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9c33cd91b1f987784d1927dc4ff884f852f4694 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6acfd8113b0c40ed129b0abd1f404277bbd56ae8d9708d89a7f5f5708cd04e14 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_4_val_metrics.pth b/r2_no_ds/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3cad2f056072e7b1c1ce8a8bf445e031dff5e44f --- /dev/null +++ b/r2_no_ds/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc187a49813ba2ae66aaf89d99ce7cbdf6cffc31db00b9f15a65f93ef15c5d17 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_5_train_metrics.pth b/r2_no_ds/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b5e48a675e0f62738005fbbe947eaddf93361da --- /dev/null +++ b/r2_no_ds/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba50b350f918f3683d41abd9a93ac4a6f4c62087d094ef26a78a3c0cd267200b +size 1304 diff --git a/r2_no_ds/run/logging/epoch_5_val_metrics.pth b/r2_no_ds/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef8afa33c523e7cc4535afdecd917eac46c5ff57 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166c844684fe9e51df3b911f7c21dcf6b501a4e80707bc093728baacdf3077e9 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_6_train_metrics.pth b/r2_no_ds/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6b2fdd3d7f7d5f51c332320fad430c7370102a8 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27bc53fdc7f1789fdc6bd5480e9eecc6ddea6ff6c46cf76b4f2ef8d7eb486e7a +size 1304 diff --git a/r2_no_ds/run/logging/epoch_6_val_metrics.pth b/r2_no_ds/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..4fe02b7798078a9505734ee57a52a384bec5515e --- /dev/null +++ b/r2_no_ds/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ddf1ec843b92618afb4c1e6a3d305dd78c10f3218262b4105b3e9d1f6e7f5c +size 1360 diff --git a/r2_no_ds/run/logging/epoch_7_train_metrics.pth b/r2_no_ds/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a761c99b977b3e5f6c4d17ef37addfbb4b381d97 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c472c330afdefa68fb2937dcb0f896848b9d44e90a0fee4af919bcaf646fb20 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_7_val_metrics.pth b/r2_no_ds/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..73d95e21fd2af9b7b3c8a65b8d190532873c5fe0 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93aa1b5890ab3f7169b01b6e766aa7a4592bd378fa8d6b1c3e78dd68aab01ff1 +size 1360 diff --git a/r2_no_ds/run/logging/epoch_8_train_metrics.pth b/r2_no_ds/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ea415079a3e64a32436ac5a050a9cb65368dbe6 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:320f2ef08396412e5f50121a00062946bd5ea125df0b15801db9ca0afdb0e0c3 +size 1304 diff --git a/r2_no_ds/run/logging/epoch_8_val_metrics.pth b/r2_no_ds/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e04978605eb0693640d131d6917d6dddcc12dc2 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ddae8c0f6191923a81ef4c0cf462565c66c6a67352c02af6256e13f28270af +size 1360 diff --git a/r2_no_ds/run/logging/epoch_9_train_metrics.pth b/r2_no_ds/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..76459eeeaa3510d6c290e009ea9d9a071f53b2db --- /dev/null +++ b/r2_no_ds/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ece01db290369691e15962c4a9eb269bd39499751a51e983c41571989366acf +size 1304 diff --git a/r2_no_ds/run/logging/epoch_9_val_metrics.pth b/r2_no_ds/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c5909434e4ea2f3cad1c764a80ea72a0935be88 --- /dev/null +++ b/r2_no_ds/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3125b4bfef4b1348962ecd74db0e60801456e8e659d68a5444fdf77d321b386c +size 1360 diff --git a/r2_no_ds/run/logging/exp_cfg.yaml b/r2_no_ds/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..093fdde1cfcf04b0120674e433161059b3055cbd --- /dev/null +++ b/r2_no_ds/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ds/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 2 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ds/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ds/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ds +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ds/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ds/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 619101 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r2_no_ds_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r2_no_ji/run/checkpoints/acc/README.md b/r2_no_ji/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r2_no_ji/run/checkpoints/acc/adapter_config.json b/r2_no_ji/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r2_no_ji/run/checkpoints/acc/adapter_model.safetensors b/r2_no_ji/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3028c5c72b7926682b2dc78608feb5b8fbb3dea6 --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4976a4eacc65a76c53b59dda17958f05da0b401b703fd19bb2f22ee4bb7bc8c +size 45771496 diff --git a/r2_no_ji/run/checkpoints/acc/best_optimizer.pt b/r2_no_ji/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..60abadc9979a03b1f95abcc53828ea2b77bbbe38 --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7b3e94b45e96476d657a5d4e36e9eb54aa3b2c56a80396597feb9dbbc6b2ec +size 91855438 diff --git a/r2_no_ji/run/checkpoints/acc/best_scheduler.pt b/r2_no_ji/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..09adcae3684d88c5c525d5804913ccfa5ca2cf96 --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750e564fc3878bc11cecae1e256a46e3f1ba4051a3f513f442949c84a664f210 +size 1084 diff --git a/r2_no_ji/run/checkpoints/acc/saved_metrics.pth b/r2_no_ji/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6af24174ca6d164d1766a6d710cffec323374513 --- /dev/null +++ b/r2_no_ji/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b799d31be4dd86864652ef044168f0172bf16bb7a784c835aaffe9d45eeb7c90 +size 1016 diff --git a/r2_no_ji/run/logging/epoch_0_train_metrics.pth b/r2_no_ji/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0f3287f702a0dd6350018fffa878aa659c3daff --- /dev/null +++ b/r2_no_ji/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a886fa151b1eef2a0f91a303eb79150c69afdd6fbd4be6318b44e1d883aa70b9 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_0_val_metrics.pth b/r2_no_ji/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..132062b0815840aeace61a262371e15783536088 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec95e7f3bbf66cc5bb1bc40553eb177085dac680f06e2c237d2bf1e5dfd12b7c +size 1168 diff --git a/r2_no_ji/run/logging/epoch_10_train_metrics.pth b/r2_no_ji/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6aacade0ddf28efb3f65c0f7610fb4680a56192a --- /dev/null +++ b/r2_no_ji/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e5abc796ae9a3bcc60ad56ef4c492367e83aec65f8b63ecc438ef28b6cc1f9 +size 1372 diff --git a/r2_no_ji/run/logging/epoch_10_val_metrics.pth b/r2_no_ji/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..75191728dcc80404c859c3f6c85cc90409849607 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a950614d30da387f8b178b2ec1e95e8c8cb9215b2a8a9d7d335466e996a7c6e0 +size 1172 diff --git a/r2_no_ji/run/logging/epoch_11_train_metrics.pth b/r2_no_ji/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6ba0c640b61be66b8717a598189b9f295e03120 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd1e6553e571152d69010befcfbe0ea630a3452a228416ab5c9d550a51ac2d3 +size 1372 diff --git a/r2_no_ji/run/logging/epoch_11_val_metrics.pth b/r2_no_ji/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..996f5375b842cea3f163688f259fc7c11c0fba9c --- /dev/null +++ b/r2_no_ji/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c10a9c68e03bce8a651ed3267caf74e37aea6fb0f516e7c91dc0be4837eebd2 +size 1172 diff --git a/r2_no_ji/run/logging/epoch_12_train_metrics.pth b/r2_no_ji/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d86f3945d93705e6be4fabd278a417c7bcf7fa66 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85171732d963e54bb6c9f413b4e76b6fc300845a8dc0ce88b37ab7df8658c521 +size 1372 diff --git a/r2_no_ji/run/logging/epoch_12_val_metrics.pth b/r2_no_ji/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d54bd24d0b4812c496b33f1e05879035ac83ab2 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e149c4d519193747c13b086fa106920b8d9a2e9bf08069f45748669a813d97 +size 1172 diff --git a/r2_no_ji/run/logging/epoch_13_train_metrics.pth b/r2_no_ji/run/logging/epoch_13_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..29b0f689c29717f3eeed1b990c80733151e2566c --- /dev/null +++ b/r2_no_ji/run/logging/epoch_13_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd3a378928475f47c1d99fc760021c2332de50b4e88d141154369de4901336e +size 1372 diff --git a/r2_no_ji/run/logging/epoch_13_val_metrics.pth b/r2_no_ji/run/logging/epoch_13_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae4edb11d9e4d75d6ad8fc6b260e910f7a3c6faf --- /dev/null +++ b/r2_no_ji/run/logging/epoch_13_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8b810d623443d55fdbcb08a4aeca254d9948fad363ea435b9b71fc679417bc +size 1172 diff --git a/r2_no_ji/run/logging/epoch_14_train_metrics.pth b/r2_no_ji/run/logging/epoch_14_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..73e04990378fb40622d313e0c09d97ae9882787d --- /dev/null +++ b/r2_no_ji/run/logging/epoch_14_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:063c9566bc24fd01b18a39835241305dfc8064eb0b2a4519b107ea4b5ac529e5 +size 1372 diff --git a/r2_no_ji/run/logging/epoch_14_val_metrics.pth b/r2_no_ji/run/logging/epoch_14_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6975a38a8d4251e4103d1c70bf4b68b0132b5f73 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_14_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1957a5fcff9ca0118f3f2c9785b4a3f8cabfdb9f82bbbb0bc37384ae146732ca +size 1172 diff --git a/r2_no_ji/run/logging/epoch_1_train_metrics.pth b/r2_no_ji/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..437464505a247f3c2295f8aae2341dcec2742dd0 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eeaa31249e662c2d6eebdae30f14114fd70ab4a30e670108dd5da5b561518c0 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_1_val_metrics.pth b/r2_no_ji/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..04be2a9ab3614b8dbcee09a4ce68e688117a2146 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb42ca3827097e3a826531434acbb33594def3de7cdf073348ea8b086f69a416 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_2_train_metrics.pth b/r2_no_ji/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d86e7c20aa2e4c3814b463baaf4a735ae970aac1 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed8fde23b07f3f30f050ebf5f2a795fe4bc33419bcedafa772aff908866b15dd +size 1304 diff --git a/r2_no_ji/run/logging/epoch_2_val_metrics.pth b/r2_no_ji/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e99dd381051ca10695a3eef90d2d033ec543d8c --- /dev/null +++ b/r2_no_ji/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb65f5ef4f6748ebf7f9873894e6b04fadad7e96ad412889637680a91a802bf7 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_3_train_metrics.pth b/r2_no_ji/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..54fc39d67865a07bc6550abdf46ae1bcfd66abbb --- /dev/null +++ b/r2_no_ji/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c823f0ea98787f4e945beede5f0d13e030afe1ba295a228eb1b186bdf07b4793 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_3_val_metrics.pth b/r2_no_ji/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..884cd0ae879e21ebec137cf099245d1354f88e72 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed2562591ab3a2592373ea70d5e5a775cfc695a6a1c9f57793077a78f9da6dd +size 1168 diff --git a/r2_no_ji/run/logging/epoch_4_train_metrics.pth b/r2_no_ji/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c5ab053ddd63cd4cf64762eca24696efa573db3 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e0ef2f2372a491b0ff1ad6029c2ccea6ae916d0267fd75baa9674a0aff0266 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_4_val_metrics.pth b/r2_no_ji/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6e67f3bf49b867b62e551d749f9a2641fffeb2b9 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517a8a90e7892d047238e5151ada2e6db2fccae0223cc3b458d4db6527806972 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_5_train_metrics.pth b/r2_no_ji/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ecb85c38151d7390d9973cfe903ce67194ad923 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64cc37b613d08049e465285ad0b85965fa9f63dc08d65ea56907ccf56a88836b +size 1304 diff --git a/r2_no_ji/run/logging/epoch_5_val_metrics.pth b/r2_no_ji/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..087ac6305796948bd1d6dd7e25cf5ba51d559e98 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae2828fdca6117a8bd3871ea0510660f6a7adcdd8366ae7d6e726523b362da7 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_6_train_metrics.pth b/r2_no_ji/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1123aa4f70d5b5e30b139cb554cdcfd1066eb6f5 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b29d2b018bfc5436b2aef9ea747ad6c6e327424ec3c57c2e31d02d120b5b4707 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_6_val_metrics.pth b/r2_no_ji/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..45871cd6c1b8086e2bd2ec8f3567a66385f91fde --- /dev/null +++ b/r2_no_ji/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217d1ea2c7d9a8e9350571a05fbbfb8eeb7f3ae8014d642f0d49db99fa2f7995 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_7_train_metrics.pth b/r2_no_ji/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a4a915f3c46a2c9c611644249b3b289a66d99154 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b55ca80a96de6088d34d66da2ffccc1b57920f7d824c2359e2e8fef302161f +size 1304 diff --git a/r2_no_ji/run/logging/epoch_7_val_metrics.pth b/r2_no_ji/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dd5c48f08f71422552fee8c386944a8f0f292318 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f113ae42ca09ed45a3cf2f783abe5107db2becd01e2152255067ac6cf128cc89 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_8_train_metrics.pth b/r2_no_ji/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6e02d4de2f629b838f282feb8dbdab1e7ce380d --- /dev/null +++ b/r2_no_ji/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67231d83a1d227366e320393466ca9bdf0b3913d7d70deba3a8fb8261bf1a1b0 +size 1304 diff --git a/r2_no_ji/run/logging/epoch_8_val_metrics.pth b/r2_no_ji/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe8576d53fac3476e640479b7e35a1eebcb99b59 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62f0503d5489040d2ede35564b6b0d0c532894a4756330b3b96289fea785c9a9 +size 1168 diff --git a/r2_no_ji/run/logging/epoch_9_train_metrics.pth b/r2_no_ji/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a2d8eec236599b73c0b7a0126d5c95745a789339 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee49d388014d4e9993dd1bdcd2aa0489f3e20e27c9571ca0292ab29541e0eaaa +size 1304 diff --git a/r2_no_ji/run/logging/epoch_9_val_metrics.pth b/r2_no_ji/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3320ae3c4197f4117ffa6f14d7c5bdee1d94699 --- /dev/null +++ b/r2_no_ji/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:046b95c3f102d44cef047303c987ed7e6dcd9a866292e161b812a1cfb09002f0 +size 1168 diff --git a/r2_no_ji/run/logging/exp_cfg.yaml b/r2_no_ji/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..5027a8b0f04c1648ec04e80b3065b261730d36c4 --- /dev/null +++ b/r2_no_ji/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ji/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 2 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ji/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ji/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ji +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 15000 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r1_no_ji/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 912989 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r2_no_ji_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r3_baseline/run/checkpoints/acc/README.md b/r3_baseline/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r3_baseline/run/checkpoints/acc/adapter_config.json b/r3_baseline/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r3_baseline/run/checkpoints/acc/adapter_model.safetensors b/r3_baseline/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eff6a4f1896fa329d22075fadb115600851b17dd --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87014f48c5be922176c653249a16310688d0b9603a94cfdeefdd4054dd895e17 +size 45771496 diff --git a/r3_baseline/run/checkpoints/acc/best_optimizer.pt b/r3_baseline/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c69e20630a3cbe065ca8b9844a1457f60d745d7 --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb1e0cfa6520f084596af6ec053ba6305ed566db119a3a93dafb0be158af00c +size 91855438 diff --git a/r3_baseline/run/checkpoints/acc/best_scheduler.pt b/r3_baseline/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f6c9b5ec67f91ace562b0b022444f1ee030ef0 --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66ef6bf58f29b5e73c83eca3db44912ad7480f0602a08d91fc6178bc7acc997 +size 1084 diff --git a/r3_baseline/run/checkpoints/acc/saved_metrics.pth b/r3_baseline/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1269e655e5bac0b388f17b7a41aac41bd3699a54 --- /dev/null +++ b/r3_baseline/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a8fcb7d42ed32ea3a444e4d64ff2088c413ac0c3c9af0263a115db17d8fb21 +size 1016 diff --git a/r3_baseline/run/logging/epoch_0_train_metrics.pth b/r3_baseline/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..b4a094a1d265d1dcefe5cf79534454b650ed6eb9 --- /dev/null +++ b/r3_baseline/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dadf782e608300a4774b6ff56944fe0406d7221fa6c862668d19d477c07d753f +size 1304 diff --git a/r3_baseline/run/logging/epoch_0_val_metrics.pth b/r3_baseline/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..065a4f6bd43d75eaf794859052e04ea0ab00de62 --- /dev/null +++ b/r3_baseline/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf8874be6f79c32a9cc752ec4f5697ff511302e995b8e8b39e57821e6af4179 +size 1168 diff --git a/r3_baseline/run/logging/epoch_1_train_metrics.pth b/r3_baseline/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d58eb443214777fee431ed0c1c6afc10fd8cad9d --- /dev/null +++ b/r3_baseline/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539c2546600b102bb6ea1eebf346cb25e8e43e933aa7e5cfb5a61b9b242ed4a7 +size 1304 diff --git a/r3_baseline/run/logging/epoch_1_val_metrics.pth b/r3_baseline/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..befe3983a45700263778401e5794fa24e2e020a2 --- /dev/null +++ b/r3_baseline/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55429be472371ebb9b4172b25287f01fe007d85e666b7a0ea4a2895aec24e3eb +size 1168 diff --git a/r3_baseline/run/logging/epoch_2_train_metrics.pth b/r3_baseline/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e37175f942ecdcbf676616e3169524c239b9063 --- /dev/null +++ b/r3_baseline/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b500b600b99fa3fe8fb6755f32dcd2ddbcee9a03472750dcc90b66b7efe5c9 +size 1304 diff --git a/r3_baseline/run/logging/epoch_2_val_metrics.pth b/r3_baseline/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d44b6de9a0b3aa1eba5582d5d0839ce57624ba71 --- /dev/null +++ b/r3_baseline/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a38b02a10575eb5b968d04de777a6a3c89754e9bcd43457894939e63976bfd +size 1168 diff --git a/r3_baseline/run/logging/epoch_3_train_metrics.pth b/r3_baseline/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dca685b1d091e8ac98deb0b375d718306d4a41e8 --- /dev/null +++ b/r3_baseline/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a0843c0136ba596cdbd151eb988ec731e9624e07722f56ca967e9156b39d7c +size 1304 diff --git a/r3_baseline/run/logging/epoch_3_val_metrics.pth b/r3_baseline/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..682557fe5a4bd9fac93b8fb386bc492afa14b6fa --- /dev/null +++ b/r3_baseline/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ab765f2e737fd196985f4d9bfcf4de48075d704493915c89d823aecfe47737 +size 1168 diff --git a/r3_baseline/run/logging/epoch_4_train_metrics.pth b/r3_baseline/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0da541a8fc4ceb52dfe1537c8735442417316c2a --- /dev/null +++ b/r3_baseline/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:283723858f19d7d36eaea12f4ad54f7d1937f8702e384320301bd16ff424f5f2 +size 1304 diff --git a/r3_baseline/run/logging/epoch_4_val_metrics.pth b/r3_baseline/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f7febe59938b1df31afbc4b421920ca6a4344ff --- /dev/null +++ b/r3_baseline/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88cad97d893e8f2a53bd094a05ed8803a8fd9378e33bb433fd4d01d7307e1a89 +size 1168 diff --git a/r3_baseline/run/logging/epoch_5_train_metrics.pth b/r3_baseline/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f9436b63f0befc7d7ad5daa1f06675a4f264e5b --- /dev/null +++ b/r3_baseline/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e567b9343ee54e16652cdc9d9df8993b221ede031ab0978c2754727558ce44a +size 1304 diff --git a/r3_baseline/run/logging/epoch_5_val_metrics.pth b/r3_baseline/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf69fd1d7a5dcb1a80fbe886bb3f3c0d2d345f20 --- /dev/null +++ b/r3_baseline/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f982f2ef1e6cc391ac1b94f84e58c1fb191e72fcca0fa58168724106ffafa70f +size 1168 diff --git a/r3_baseline/run/logging/epoch_6_train_metrics.pth b/r3_baseline/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..270dbc18433a6cfab6486e7c48e889002bd614c6 --- /dev/null +++ b/r3_baseline/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a66607c70e34f66baf34b9cef381b3adb72c8c1e6a396076a76b6ab672ef502 +size 1304 diff --git a/r3_baseline/run/logging/epoch_6_val_metrics.pth b/r3_baseline/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..99a05c8bdd652e281973597efbac15579e05ebda --- /dev/null +++ b/r3_baseline/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f5a3c54979f5856a2c0db3eb422c9d8203b5dab694a0d55b070a5edaa0cf6f +size 1168 diff --git a/r3_baseline/run/logging/epoch_7_train_metrics.pth b/r3_baseline/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6bb480eae832f9da4ae46b04ccb621c91c6477f0 --- /dev/null +++ b/r3_baseline/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c52140033137842792ffa2ad63b0a6856d3bc0d4791e819f6fd378ffbe6db7d +size 1304 diff --git a/r3_baseline/run/logging/epoch_7_val_metrics.pth b/r3_baseline/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..96595eb74ff91277832719d1dfa873522e808a44 --- /dev/null +++ b/r3_baseline/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a923028526fd015bfd2bf71ee26bbfa8aa714b9363517c65c968537730f789c +size 1168 diff --git a/r3_baseline/run/logging/exp_cfg.yaml b/r3_baseline/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..df132502c64c4f931117c839598766771feac44e --- /dev/null +++ b/r3_baseline/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 3 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_baseline/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: baseline +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 17500 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_baseline/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 835313 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 2 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r3_baseline_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r3_full/run/checkpoints/acc/README.md b/r3_full/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r3_full/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r3_full/run/checkpoints/acc/adapter_config.json b/r3_full/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r3_full/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r3_full/run/checkpoints/acc/adapter_model.safetensors b/r3_full/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..520b1519e14e2e464ff99d5d134731e3edeefb15 --- /dev/null +++ b/r3_full/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b169f4b68f9b35602e73f3b9d4a1b5ad1a3bc25826b73d44f828d495a7de025e +size 45771496 diff --git a/r3_full/run/checkpoints/acc/best_optimizer.pt b/r3_full/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65ea3df2b4331dc88ca2acad4629f5df071bf51 --- /dev/null +++ b/r3_full/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af19193450d6fa4919db669c64d678e8e385a7bcacfdc33c77f2334f37ee7a0a +size 91855438 diff --git a/r3_full/run/checkpoints/acc/best_scheduler.pt b/r3_full/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..50f50795e132a02ccbe8fd94a66c25060d26892b --- /dev/null +++ b/r3_full/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be14cdd96c230c4d3c529af42e04ec48d437771ccf6bbd2555ac26f257e846c +size 1084 diff --git a/r3_full/run/checkpoints/acc/saved_metrics.pth b/r3_full/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f809edbdb1a766837d792c3f3e1f6c067accc65 --- /dev/null +++ b/r3_full/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2310c5fa745834bbb983148663655e9bb01d50da6232f9bb51609ee13deb6818 +size 1208 diff --git a/r3_full/run/logging/epoch_0_train_metrics.pth b/r3_full/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..30b98b8ea35bdd76e25a50a3989ff29f956bf110 --- /dev/null +++ b/r3_full/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95d6f3e23a8d461c713495fcfdd0be2668c13de8058e942d700b2034c920c95 +size 1304 diff --git a/r3_full/run/logging/epoch_0_val_metrics.pth b/r3_full/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..25376e1ad364264085f1ea04d57c2dd12927ddbf --- /dev/null +++ b/r3_full/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f81998d832d097ce37965dab09e0e4607288f5701d2c0917c2c189fb08c39b +size 1360 diff --git a/r3_full/run/logging/epoch_1_train_metrics.pth b/r3_full/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..254dd6db0c395b5e25382b6049708eac9c026f74 --- /dev/null +++ b/r3_full/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ae331e90060b9d6b097d64f15ba518a3f68ad1f00155c3651437d4632a371be +size 1304 diff --git a/r3_full/run/logging/epoch_1_val_metrics.pth b/r3_full/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2a485326ba1c637a25f4e9a74c6d76f5d835262f --- /dev/null +++ b/r3_full/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fec481bc34d9a5bee419c55c2117e5400b8e1feb5b6530194c42e525a1e4f71 +size 1360 diff --git a/r3_full/run/logging/epoch_2_train_metrics.pth b/r3_full/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..46b93107880fd00b5e579ef1628da71dfe1b0b7c --- /dev/null +++ b/r3_full/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332a40741aa84a41da985821654241247af2158e5873ba2c3290dc2066d1ecde +size 1304 diff --git a/r3_full/run/logging/epoch_2_val_metrics.pth b/r3_full/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..67fd55af69a28d6580ad9f15cd2005109f6e8d7e --- /dev/null +++ b/r3_full/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c09b40ee98a3ec103f1189edc75ab071d0749555dffe37eba5cebaa55984fbda +size 1360 diff --git a/r3_full/run/logging/epoch_3_train_metrics.pth b/r3_full/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e8a2fc1fe91d3b1b17f61881a2958ba701bd073 --- /dev/null +++ b/r3_full/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeebd7e2b35789d933c4af6b8bed167adb36bd3cddb0b735edb2385a36713e8d +size 1304 diff --git a/r3_full/run/logging/epoch_3_val_metrics.pth b/r3_full/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1bf4cf637616b9b72bf8f2fe0fca67b1f0c8cad2 --- /dev/null +++ b/r3_full/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2da7a0b8b54a56ed31e5146ab488bbec4010256f1d44d2c030210ab6a361de +size 1360 diff --git a/r3_full/run/logging/epoch_4_train_metrics.pth b/r3_full/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd72fe79f6a120334060a104bd74fe8c5dd2907a --- /dev/null +++ b/r3_full/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01310458cf7f984ce3e1cbbacb21964838bcf77388a2f72551bb11e60fd0478e +size 1304 diff --git a/r3_full/run/logging/epoch_4_val_metrics.pth b/r3_full/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..a18cc7647a5b7cc82e9ab73facc8bd7af58c9e46 --- /dev/null +++ b/r3_full/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d280a51ad5714a3b930edb7d93f9ad69a3dbd23e26e3c5d5a97126888f7ba3b +size 1360 diff --git a/r3_full/run/logging/epoch_5_train_metrics.pth b/r3_full/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c62104441fb3f23491230c83f52e73139f9b9428 --- /dev/null +++ b/r3_full/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9db0e07ed7d4a8fab63b1a02b956e19ebd42da2d180a11bbb8979237d11c473 +size 1304 diff --git a/r3_full/run/logging/epoch_5_val_metrics.pth b/r3_full/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..05a64817fc04b557613306abc7f3add1347c8771 --- /dev/null +++ b/r3_full/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964ea5ed04984a3c01c0548d30ccbc42a854ecf85697873c3f8d5f5f3b055ae9 +size 1360 diff --git a/r3_full/run/logging/epoch_6_train_metrics.pth b/r3_full/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..94e45055dc607b951844ddb898d9eb870036b3bf --- /dev/null +++ b/r3_full/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f01b709e3a32c476a05ff791d59a36c0f157be025a4e791c8889e5b6cf18ae +size 1304 diff --git a/r3_full/run/logging/epoch_6_val_metrics.pth b/r3_full/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c3dc180b1d928d3afbfe68fd8aa01c1918c805f --- /dev/null +++ b/r3_full/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4900bc25119c7125c381a37941d497ed348a6f45630a364863f5e3aef6c7c25b +size 1360 diff --git a/r3_full/run/logging/epoch_7_train_metrics.pth b/r3_full/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..babde92de833989ac45f55a3e3f8d7fefb5f92bf --- /dev/null +++ b/r3_full/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b023e2a5b2cf5bbe733442492fe9257b76dd496a12fe079bc2ac3ae48c2efcb +size 1304 diff --git a/r3_full/run/logging/epoch_7_val_metrics.pth b/r3_full/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d4d400106f0e9f73c7e99318d4e2130ad4cb5eb --- /dev/null +++ b/r3_full/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee047086a60d771064c1393e2991b86802169e007e9f597a4f36a409cfa7ace +size 1360 diff --git a/r3_full/run/logging/exp_cfg.yaml b/r3_full/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..3a8ca2fc63d6536a4902e5dc65931cbc02105e06 --- /dev/null +++ b/r3_full/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_full/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 3 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_full/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_full/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: full +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 17500 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_full/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_full/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 133395 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r3_full_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r3_no_ds/run/checkpoints/acc/README.md b/r3_no_ds/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r3_no_ds/run/checkpoints/acc/adapter_config.json b/r3_no_ds/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r3_no_ds/run/checkpoints/acc/adapter_model.safetensors b/r3_no_ds/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbc4e581477cb3594a2c9aeb4b737e08bf61605c --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2181f3b27a1a42950ccd96cab32ec8828e722e0e97655fd1bb39ce8edfb043 +size 45771496 diff --git a/r3_no_ds/run/checkpoints/acc/best_optimizer.pt b/r3_no_ds/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00211c8e07c27a4e75be2f47ae38241ec2c87aa --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b3089bdaaaff1ac9df7bee3c9218955bffda1f8eeb85caf1240a82fb1d9b32 +size 91855438 diff --git a/r3_no_ds/run/checkpoints/acc/best_scheduler.pt b/r3_no_ds/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f6c9b5ec67f91ace562b0b022444f1ee030ef0 --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66ef6bf58f29b5e73c83eca3db44912ad7480f0602a08d91fc6178bc7acc997 +size 1084 diff --git a/r3_no_ds/run/checkpoints/acc/saved_metrics.pth b/r3_no_ds/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c9dc489d572250a6cee46d04a502ddb2192f12ed --- /dev/null +++ b/r3_no_ds/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820aee39ef3bc4bb28348447301e4d0c019092fc58561ee258c0ec3f8dad122d +size 1208 diff --git a/r3_no_ds/run/logging/epoch_0_train_metrics.pth b/r3_no_ds/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ddfe4f56b1f205a56e13442a6c9bdcf3e8b02ab --- /dev/null +++ b/r3_no_ds/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc17e609ab64a94193cd1aa9bc27d94868fb46d21f74a5f88bf0b673c77307b +size 1304 diff --git a/r3_no_ds/run/logging/epoch_0_val_metrics.pth b/r3_no_ds/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f48f469d8114f70420f437c28d02e89b122117b --- /dev/null +++ b/r3_no_ds/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0ccefe76e9fc1622133b4c2861a51717ad94401c3a0ff68d0ad747baf7580c5 +size 1360 diff --git a/r3_no_ds/run/logging/epoch_1_train_metrics.pth b/r3_no_ds/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..58060d517966dd8fbb22131d2b2ba8a81c65a753 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1a2515c569e64eac716d5181f5a799cd884f2be5077701cab9494be36ad767 +size 1304 diff --git a/r3_no_ds/run/logging/epoch_1_val_metrics.pth b/r3_no_ds/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..158eeab390595f10cd0e148b497d78caeec2cbc2 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c7c5b0edf41aa4faff850ceb98524cf131f45d722362e4cf8b2079b3c628cb +size 1360 diff --git a/r3_no_ds/run/logging/epoch_2_train_metrics.pth b/r3_no_ds/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..556157699b64d5cc81626c5cd81350335ddd7c53 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc3a72e91a5a37424e41eb69574b1b133c96e382b365a5ad392410e52c1d9737 +size 1304 diff --git a/r3_no_ds/run/logging/epoch_2_val_metrics.pth b/r3_no_ds/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..373a81200833d7b693dc94cab83dae0126302972 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbfba0dd0541e31e0d6efa192a3832542b1dff8c465252346cd10c2deb5d27b +size 1360 diff --git a/r3_no_ds/run/logging/epoch_3_train_metrics.pth b/r3_no_ds/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..58429e2ed0a87c339fe3681a6cd2740ec17df857 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b1ed99592be2ea5b657a976dc547d9f504aa2695c82586022bb2ce19dfd4e4 +size 1304 diff --git a/r3_no_ds/run/logging/epoch_3_val_metrics.pth b/r3_no_ds/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbd26a1857ae40c46fa594b0c0d50b3facbdf738 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6830b285b7c88bba8cbbffbb06b10132daeba730164072ad420095af14934a7b +size 1360 diff --git a/r3_no_ds/run/logging/epoch_4_train_metrics.pth b/r3_no_ds/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..513b60f1caaaa685cf2d58a73cc3e8758ffbe87b --- /dev/null +++ b/r3_no_ds/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe947255ad08ab23419fa99fcc7d95ee7182c1972ba2e3b01016a926e70f70b +size 1304 diff --git a/r3_no_ds/run/logging/epoch_4_val_metrics.pth b/r3_no_ds/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a315df53407d7468054df3eaa4f1f022573d710 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381f0ed197718c933e4ec108fcee51d924dcfc199c2f45de5169cb696f2d4b9d +size 1360 diff --git a/r3_no_ds/run/logging/epoch_5_train_metrics.pth b/r3_no_ds/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c37120ee0075ae7ab0dedc06efe5cb683dbbc93 --- /dev/null +++ b/r3_no_ds/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729ff97307754a935c9a482168317d686b0afba2f2d826eea6e06a3370e33b97 +size 1304 diff --git a/r3_no_ds/run/logging/epoch_5_val_metrics.pth b/r3_no_ds/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f21763f0c231701a8866db3fcbd92086417b6bea --- /dev/null +++ b/r3_no_ds/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddbc4c2b512b93e5e1e5c0ef1bb0620cee98112be6c4c8bf775c6776e857a49 +size 1360 diff --git a/r3_no_ds/run/logging/epoch_6_train_metrics.pth b/r3_no_ds/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7af90aa2fe3ca55a9407a8f5732414a0423cf5eb --- /dev/null +++ b/r3_no_ds/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:924023dba00b4e54638265c98e79b5c333bbec6123117b45fa973b669f909bfc +size 1304 diff --git a/r3_no_ds/run/logging/epoch_6_val_metrics.pth b/r3_no_ds/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..27fb9e993cc083c24cda9e99223055d366ad10be --- /dev/null +++ b/r3_no_ds/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648f8c5d59187008c59e5ae7fe8a79da3ad4e8f86aba2404ab3a3780e788fb39 +size 1360 diff --git a/r3_no_ds/run/logging/epoch_7_train_metrics.pth b/r3_no_ds/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6e76fecd2abfc3701fdc0a62dd85ab9e82c2166c --- /dev/null +++ b/r3_no_ds/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45fcfe485a08c7cedaf1d23cbc7ed00e87ee06ab64f057de6fdbaddfa0212e94 +size 1304 diff --git a/r3_no_ds/run/logging/epoch_7_val_metrics.pth b/r3_no_ds/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..aed33f595678e11deb1ad51cb3f7e9dbd198e14b --- /dev/null +++ b/r3_no_ds/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f46f66c5a95a23d22324c7a41fa770313655ae71af915f1c70cc0463aa0256 +size 1360 diff --git a/r3_no_ds/run/logging/exp_cfg.yaml b/r3_no_ds/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..05f179abcc3af900f52549dc25738c468c4c3b61 --- /dev/null +++ b/r3_no_ds/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ds/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 3 +evaluation_type: joint +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ds/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: '' +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ds/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ds +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 17500 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ds/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ds/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 227174 +shared_parameters: true +speaker_filter: '' +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 2 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: false +use_wandb: true +wandb_experiment_name: r3_no_ds_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1 diff --git a/r3_no_ji/run/checkpoints/acc/README.md b/r3_no_ji/run/checkpoints/acc/README.md new file mode 100644 index 0000000000000000000000000000000000000000..2d4c19b14ebbb9a403d09e6532e46ccfcd7b82cb --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: HuggingFaceM4/idefics2-8b +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.10.0 \ No newline at end of file diff --git a/r3_no_ji/run/checkpoints/acc/adapter_config.json b/r3_no_ji/run/checkpoints/acc/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a6a12bf8b59da5b42d042490beafd765fe95f7af --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/adapter_config.json @@ -0,0 +1,29 @@ +{ + "alpha_pattern": {}, + "auto_mapping": { + "base_model_class": "Idefics2ForConditionalGeneration", + "parent_library": "transformers.models.idefics2.modeling_idefics2" + }, + "base_model_name_or_path": "HuggingFaceM4/idefics2-8b", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": "gaussian", + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 8, + "lora_dropout": 0.1, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 16, + "rank_pattern": {}, + "revision": null, + "target_modules": "(.*(vision_model|modality_projection|perceiver_resampler).*(out_proj|fc1|fc2|down_proj|gate_proj|up_proj|k_proj|q_proj|v_proj|o_proj).*$)|(.*(k_proj|q_proj|v_proj).*$)", + "task_type": null, + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/r3_no_ji/run/checkpoints/acc/adapter_model.safetensors b/r3_no_ji/run/checkpoints/acc/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..559761471bd2ba2da1e53270bd3b71c32c7d1aa7 --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c52ce3fb668d9f9a435f5b408c1f5e0d3ab04f69f889e3e5cd0170c639ac167 +size 45771496 diff --git a/r3_no_ji/run/checkpoints/acc/best_optimizer.pt b/r3_no_ji/run/checkpoints/acc/best_optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1425ffa4f0eb19bb18f984be3113545271d5ff2 --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/best_optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea9d8c05aaac98a98ffbb67b7f75630ca14bbeb37445a1ce136d5cc00d07e88 +size 91855438 diff --git a/r3_no_ji/run/checkpoints/acc/best_scheduler.pt b/r3_no_ji/run/checkpoints/acc/best_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c37c0c5f5ec91124aa9db8f7b8bfc0e5a41ac88 --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/best_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543941c5d3ac00dad28f6a75b1e74394326c6600f851517afd832b1a9fea622b +size 1084 diff --git a/r3_no_ji/run/checkpoints/acc/saved_metrics.pth b/r3_no_ji/run/checkpoints/acc/saved_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..60a30ee0b077de345b0b6e68847140ad4c36167c --- /dev/null +++ b/r3_no_ji/run/checkpoints/acc/saved_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5316809cfdbea6bbd53cce7fba1e3ef1402cab10927b0d9d034b6516fd937670 +size 1016 diff --git a/r3_no_ji/run/logging/epoch_0_train_metrics.pth b/r3_no_ji/run/logging/epoch_0_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..43155d0ef75def9a6cc189bf950d7dc43efb250e --- /dev/null +++ b/r3_no_ji/run/logging/epoch_0_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23a1428a44d4aa8f3ea0c04402e32131b32490829e90fce16b6a39dc1fccf74 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_0_val_metrics.pth b/r3_no_ji/run/logging/epoch_0_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fe9bfa11ff08c75cbce903932f29402d17c1ae1 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_0_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea095c6a1b12859a0081b003208cf4e656eef5b337f3f35ba2d88223bf87f8ce +size 1168 diff --git a/r3_no_ji/run/logging/epoch_10_train_metrics.pth b/r3_no_ji/run/logging/epoch_10_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..df32f820259e61fbd5603c62ddd15d08941978e9 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_10_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de054f9d12a464f7a7bd27ed40bd80e164e3fef8d6b77dca7e0e99415b0e435 +size 1372 diff --git a/r3_no_ji/run/logging/epoch_10_val_metrics.pth b/r3_no_ji/run/logging/epoch_10_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8621c5df5bd4f22c2dcddc9720995b1b9fea5de5 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_10_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eb6ce2450df21942b32ab79792a0e59f0d9494bb4c9fe02287b99d4663c21e5 +size 1172 diff --git a/r3_no_ji/run/logging/epoch_11_train_metrics.pth b/r3_no_ji/run/logging/epoch_11_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f2ff4e714d1645b8c8a88c0403cf9b0f9677051 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_11_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7a8f55591776fb07174df40444409fafe990a7d46659e01f8f1eedbba8d1c78 +size 1372 diff --git a/r3_no_ji/run/logging/epoch_11_val_metrics.pth b/r3_no_ji/run/logging/epoch_11_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..345a7ff7a097f239e9b015d8ca7ce82c773e1233 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_11_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c6d9d43f48b68cc20b9ff40f120911511339e5e749e998c7bc92ea99880a4e +size 1172 diff --git a/r3_no_ji/run/logging/epoch_12_train_metrics.pth b/r3_no_ji/run/logging/epoch_12_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d78404c4ba632c2cdba10ace24273ed55fbfbac3 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_12_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d982c314e0a78bdfa87bc0caa3e7be6bc40ddfeed39fda160475af690932303 +size 1372 diff --git a/r3_no_ji/run/logging/epoch_12_val_metrics.pth b/r3_no_ji/run/logging/epoch_12_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2046a63c45fd151ea50e96e621ea152002e0ef47 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_12_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45afecf6546b1d5e8002a20f7322eaebeaa4d1483013b16929e8989df5ef5c2b +size 1172 diff --git a/r3_no_ji/run/logging/epoch_13_train_metrics.pth b/r3_no_ji/run/logging/epoch_13_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e08f56835a9ffe686417216e7d952de5fac9a587 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_13_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a7d39625111f86dd5ed10b3b7c11df4002afbb525aa52e77963595319fb1891 +size 1372 diff --git a/r3_no_ji/run/logging/epoch_13_val_metrics.pth b/r3_no_ji/run/logging/epoch_13_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c5b894045d8cbde7e8edb80867e973c77894e12 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_13_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7ac60053d54de7c0c12bb0d9e6db33210fa1f4d32ca0844d64ce56ea741392 +size 1172 diff --git a/r3_no_ji/run/logging/epoch_14_train_metrics.pth b/r3_no_ji/run/logging/epoch_14_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7aed472fecd332c722f4340dd76cc2f0a957df74 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_14_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418ad65d3f692ab5664d0688c07e6541d4f4480ff62b2ae5e9bc6000a35425a9 +size 1372 diff --git a/r3_no_ji/run/logging/epoch_14_val_metrics.pth b/r3_no_ji/run/logging/epoch_14_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ad32b08a4fdf8d158a8edb0543eeffc7a4b188a --- /dev/null +++ b/r3_no_ji/run/logging/epoch_14_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada1d7fa8a6ba62ad57c942d7578b927b61c1fac6ac15c339de95f0790a39cd3 +size 1172 diff --git a/r3_no_ji/run/logging/epoch_1_train_metrics.pth b/r3_no_ji/run/logging/epoch_1_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..598f3acdc3a1016e02e170eec8319297a20c0f5e --- /dev/null +++ b/r3_no_ji/run/logging/epoch_1_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e17ce6bfaa25ece5a738f694968f6675db400a94a88642cfa75d7e4dc4b3261 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_1_val_metrics.pth b/r3_no_ji/run/logging/epoch_1_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d361ca2f247af49d4fac96d1fe74bd3d92e8728 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_1_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ae8517d50e9ee651bd28ecac646893ad8d8f96380cde7dcb6db094b9486cf7 +size 1168 diff --git a/r3_no_ji/run/logging/epoch_2_train_metrics.pth b/r3_no_ji/run/logging/epoch_2_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..971dcbda1e2effba51f70aab6063e502adbe8be9 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_2_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193b0aa984ecfe82a29dcb078a259a8683e592b3d4a302098feaa59078be4845 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_2_val_metrics.pth b/r3_no_ji/run/logging/epoch_2_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d9ccc6cdfd1b3ce5491d63c6c7f716e6e065f41 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_2_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cf14be50ce4a12e0386a1112ced0882f783b29b4227d9ecf8f49997a5b1140f +size 1168 diff --git a/r3_no_ji/run/logging/epoch_3_train_metrics.pth b/r3_no_ji/run/logging/epoch_3_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..2eccefa9caa314e1afa67feb7fe66812a0aa27e1 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_3_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8759a48f63ae478295a1cac4dfd4a01503ca798af6e544a16d656bdcd8140e5 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_3_val_metrics.pth b/r3_no_ji/run/logging/epoch_3_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..44cb8c82efa5f69777db3c50435c092c1b45bb10 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_3_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a94fb3e94751190bf3d89340ab67be3a5448b2f8e80410445887396a91bb4d9 +size 1168 diff --git a/r3_no_ji/run/logging/epoch_4_train_metrics.pth b/r3_no_ji/run/logging/epoch_4_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..d4f43b11ffe3abdc90df9bdba5ef89bbf3578849 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_4_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17d9b32f4cdb91ae0f57671ec3c515e55d9f696cb950e1cfef2ee06cccdae7d +size 1304 diff --git a/r3_no_ji/run/logging/epoch_4_val_metrics.pth b/r3_no_ji/run/logging/epoch_4_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..e98e24bed953d9a51728a41b20ce868534c7932d --- /dev/null +++ b/r3_no_ji/run/logging/epoch_4_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b587cc79a89e1f3c41930ff07e990ead2bcdf3fc9fc8fe3c32681f129ff598 +size 1168 diff --git a/r3_no_ji/run/logging/epoch_5_train_metrics.pth b/r3_no_ji/run/logging/epoch_5_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..44338a057e6fbe92b468cd7e15e55f9bd9aa66eb --- /dev/null +++ b/r3_no_ji/run/logging/epoch_5_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ceb8f1d5c542596b4ff69656f22acb690e80d65d877a06b3a723f699c77242 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_5_val_metrics.pth b/r3_no_ji/run/logging/epoch_5_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..5233553f090c5db0a85135c5989e51e9de6d4d0d --- /dev/null +++ b/r3_no_ji/run/logging/epoch_5_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eca3f9f4f8a9c91cef642cdbde374f8e377916ff41294877e6506a781a00b3c +size 1168 diff --git a/r3_no_ji/run/logging/epoch_6_train_metrics.pth b/r3_no_ji/run/logging/epoch_6_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..dbfd6ec327a34bd69c1a2956f061305027f7d9ac --- /dev/null +++ b/r3_no_ji/run/logging/epoch_6_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c717d141d4caf7fa43b6afae5420dd62562cad56192221d7bd0ba599b05e21d7 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_6_val_metrics.pth b/r3_no_ji/run/logging/epoch_6_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..f49f18c82fe6c5b21280743068b6720320b8227c --- /dev/null +++ b/r3_no_ji/run/logging/epoch_6_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169cea217fa52cf7c3d82db25a687a29b071ba5e120e8fbe4e33ee00057906b7 +size 1168 diff --git a/r3_no_ji/run/logging/epoch_7_train_metrics.pth b/r3_no_ji/run/logging/epoch_7_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0c6c4046d04bfe94f2fa3d03004a73320094338 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_7_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5885ed3c5781f8d1abd8873a267a838d84d5508daba40086626cd4c9eae04ea +size 1304 diff --git a/r3_no_ji/run/logging/epoch_7_val_metrics.pth b/r3_no_ji/run/logging/epoch_7_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..92a7bd5c7a522e3af40fe8b9dd742412d5cf163c --- /dev/null +++ b/r3_no_ji/run/logging/epoch_7_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ebe69749017f26813d0bc1bc98fc35b4fe9b7bc03a886576e8a9cf120afb3a +size 1168 diff --git a/r3_no_ji/run/logging/epoch_8_train_metrics.pth b/r3_no_ji/run/logging/epoch_8_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..528912b2ad2ba2c4776a7e3824a98cb16c6e2a94 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_8_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217e249b8ce14bbf1ede47959f7f965f2c9372dc5c17e1d7e5ef277536fe54e3 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_8_val_metrics.pth b/r3_no_ji/run/logging/epoch_8_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8639e5f69505dbaab0a9a4fabc84a4a0752fa821 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_8_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f61641f888672ff271755db24234a6dd46bb3216066f85e0d36df26d68737b7 +size 1168 diff --git a/r3_no_ji/run/logging/epoch_9_train_metrics.pth b/r3_no_ji/run/logging/epoch_9_train_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..8b8f6e0f2333ff1695ea397a0d8daf33f43c80a3 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_9_train_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93022c803a53ccde9b1dd975d21ebcd917b530ae3071bad476f4e4ad8d428c60 +size 1304 diff --git a/r3_no_ji/run/logging/epoch_9_val_metrics.pth b/r3_no_ji/run/logging/epoch_9_val_metrics.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb73893ac45a079d841a96d84b8afb33ea860349 --- /dev/null +++ b/r3_no_ji/run/logging/epoch_9_val_metrics.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bf5628b28196289597b114671c625f7b50302a4b9f6638de91d1c8edc999c2 +size 1168 diff --git a/r3_no_ji/run/logging/exp_cfg.yaml b/r3_no_ji/run/logging/exp_cfg.yaml new file mode 100644 index 0000000000000000000000000000000000000000..b660338459a2e2460867899b518787f78a5f6d4a --- /dev/null +++ b/r3_no_ji/run/logging/exp_cfg.yaml @@ -0,0 +1,62 @@ +anno_len_threshold: 40 +base_folder: /home/mog29/compgen_saved_files/experiments/joint_training +batch_size: 2 +checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ji/run/checkpoints +comprehension_prompt: verbose_instruction +context_size: 10 +data_dir: /home/mog29/compgen_saved_files/kilogram/dataset +deployment_round: 3 +evaluation_type: multitask +expdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ji/run +from_scratch: true +generation_prompt: information_after +gradient_accumulation_steps: 32 +gradient_clip_norm: 1 +img_dir: /home/mog29/compgen_saved_files/kilogram/dataset/square-black-imgs +ips_clip: 5 +learning_rate: 0.0001 +listener_filter: no_neg_gen +listener_lambda: 0.5 +load_from_checkpoint: false +logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r3_no_ji/run/logging +lora_dropout: 0.05 +lora_r: 16 +lora_subset: vision_resampler +max_steps: 30 +model_family_name: no_ji +n_epochs: 15 +name: joint and multitask training defaults +name_suffix: '' +no_lora: false +no_shuffling: false +noise_filter: '' +num_samples: 10 +num_training_steps: 17500 +num_warmup_steps: 0 +num_workers: 4 +only_seed: false +past_checkpoint_dir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ji/run/checkpoints +past_logdir: /home/mog29/compgen_saved_files/experiments/joint_training/r2_no_ji/run/logging +past_name_suffix: '' +past_round: -1 +patience_cutoff: 5 +ref_strat: no_ips_for_pos +repetition_penalty: 1 +replacement_family_name: '' +sampling_type: nucleus +save_each_epoch: true +seed: 417165 +shared_parameters: true +speaker_filter: no_neg_comp +speaker_lambda: 0.5 +split_dir: /home/mog29/compgen_saved_files/split_info/ +temperature: 0.7 +test_batch_size: 4 +top_k: 50 +top_p: 1 +training_type: multitask +use_separate_dataloaders: true +use_wandb: true +wandb_experiment_name: r3_no_ji_may +wandb_project_name: tangram_continual_learning_final +weight_decay: 0.1