diff --git a/BlackSheepVision-Phi-3/README.md b/BlackSheepVision-Phi-3/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8ea0943ce13efe0300134b4c76161d8a8ac77f36 --- /dev/null +++ b/BlackSheepVision-Phi-3/README.md @@ -0,0 +1,202 @@ +--- +base_model: models\microsoft_Phi-3-vision-128k-instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.12.0 \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/adapter_config.json b/BlackSheepVision-Phi-3/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6db131c56e9e0a8676c747d1a38f41ab29779 --- /dev/null +++ b/BlackSheepVision-Phi-3/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "models\\microsoft_Phi-3-vision-128k-instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 4096, + "lora_dropout": 0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 2048, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "down_proj", + "k_proj", + "o_proj", + "up_proj", + "gate_proj", + "v_proj", + "q_proj" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/adapter_model.safetensors b/BlackSheepVision-Phi-3/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a6f3f2f5c934d15081fe6404ee98cb745078ba0 --- /dev/null +++ b/BlackSheepVision-Phi-3/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7563b9393a75fd8525e5eba4c801f65a93ead90ddbc23f21ae202aada3242e +size 5771408256 diff --git a/BlackSheepVision-Phi-3/checkpoint-1000/README.md b/BlackSheepVision-Phi-3/checkpoint-1000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8ea0943ce13efe0300134b4c76161d8a8ac77f36 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-1000/README.md @@ -0,0 +1,202 @@ +--- +base_model: models\microsoft_Phi-3-vision-128k-instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.12.0 \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-1000/adapter_config.json b/BlackSheepVision-Phi-3/checkpoint-1000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6db131c56e9e0a8676c747d1a38f41ab29779 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-1000/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "models\\microsoft_Phi-3-vision-128k-instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 4096, + "lora_dropout": 0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 2048, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "down_proj", + "k_proj", + "o_proj", + "up_proj", + "gate_proj", + "v_proj", + "q_proj" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-1000/adapter_model.safetensors b/BlackSheepVision-Phi-3/checkpoint-1000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb5de64a8043adacc2aef6d297a5df52d398af08 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-1000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29aabdd5ebb2c0f9f9ca3e53f8f185afce27f1217865a83db49c9f645533bff7 +size 5771408256 diff --git a/BlackSheepVision-Phi-3/checkpoint-1000/training_log.json b/BlackSheepVision-Phi-3/checkpoint-1000/training_log.json new file mode 100644 index 0000000000000000000000000000000000000000..7198efc6371b5130cf2c453ee2ed44bd56b2eeaf --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-1000/training_log.json @@ -0,0 +1,12 @@ +{ + "base_model_name": "microsoft_Phi-3-vision-128k-instruct", + "base_model_class": "Phi3VForCausalLM", + "base_loaded_in_4bit": true, + "base_loaded_in_8bit": false, + "projections": "gate, down, up, q, v, k, o", + "loss": 1.0155, + "grad_norm": 0.855490505695343, + "learning_rate": 9.886842462960446e-05, + "epoch": 0.47573739295908657, + "current_steps": 999 +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-1000/training_prompt.json b/BlackSheepVision-Phi-3/checkpoint-1000/training_prompt.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f85b67d7b4c4c05d0bcf5e2f16b6a1eb01d5c6 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-1000/training_prompt.json @@ -0,0 +1,16 @@ +{ + "template_type": "dataset", + "template_1": "Who is your creator?\n\n%creator%", + "template_2": "%ChatML_CONVO%", + "template_3": "<|im_start|> I want you to say this next statement like a Gen-Z. \n %English% \n <|im_start|> %Gen-Z% <|im_end|>", + "template_4": "<|im_start|> %prompt% \n <|im_start|> %output% <|im_end|>", + "template_5": "<|im_start|> %instruction% \n <|im_start|> %output% <|im_end|>", + "template_6": "<|im_start|> %instruction%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_7": "<|im_start|> %question% \n <|im_start|> %output% <|im_end|>", + "template_8": "<|im_start|> %question% \n <|im_start|> %response% <|im_end|>", + "template_9": "<|im_start|> %perspective% \n <|im_start|> %output% <|im_end|>", + "template_10": "<|im_start|> %perspective%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_11": "<|im_start|> %instruction% \n <|im_start|> %toxic% <|im_end|>", + "template_12": "<|im_start|> %prompt% \n <|im_start|> %chosen% <|im_end|>", + "template_13": "<|im_start|> system\n : %system% \n <|im_end|> \n <|im_start|> %user% \n <|im_end|> \n <|im_start|> %assistant%" +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-2000/README.md b/BlackSheepVision-Phi-3/checkpoint-2000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8ea0943ce13efe0300134b4c76161d8a8ac77f36 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-2000/README.md @@ -0,0 +1,202 @@ +--- +base_model: models\microsoft_Phi-3-vision-128k-instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.12.0 \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-2000/adapter_config.json b/BlackSheepVision-Phi-3/checkpoint-2000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6db131c56e9e0a8676c747d1a38f41ab29779 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-2000/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "models\\microsoft_Phi-3-vision-128k-instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 4096, + "lora_dropout": 0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 2048, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "down_proj", + "k_proj", + "o_proj", + "up_proj", + "gate_proj", + "v_proj", + "q_proj" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-2000/adapter_model.safetensors b/BlackSheepVision-Phi-3/checkpoint-2000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f048cea43044da249d21764b68638825619a9407 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-2000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:155b56140389f259fd74c3724efdca122ba6c3563feed3f652874f63e453fec7 +size 5771408256 diff --git a/BlackSheepVision-Phi-3/checkpoint-2000/training_log.json b/BlackSheepVision-Phi-3/checkpoint-2000/training_log.json new file mode 100644 index 0000000000000000000000000000000000000000..891bd76bf47b7fa3827c9cd5fd12c8048b517537 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-2000/training_log.json @@ -0,0 +1,12 @@ +{ + "base_model_name": "microsoft_Phi-3-vision-128k-instruct", + "base_model_class": "Phi3VForCausalLM", + "base_loaded_in_4bit": true, + "base_loaded_in_8bit": false, + "projections": "gate, down, up, q, v, k, o", + "loss": 0.9775, + "grad_norm": 1.721966028213501, + "learning_rate": 9.773684925920892e-05, + "epoch": 0.9514747859181731, + "current_steps": 1999 +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-2000/training_prompt.json b/BlackSheepVision-Phi-3/checkpoint-2000/training_prompt.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f85b67d7b4c4c05d0bcf5e2f16b6a1eb01d5c6 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-2000/training_prompt.json @@ -0,0 +1,16 @@ +{ + "template_type": "dataset", + "template_1": "Who is your creator?\n\n%creator%", + "template_2": "%ChatML_CONVO%", + "template_3": "<|im_start|> I want you to say this next statement like a Gen-Z. \n %English% \n <|im_start|> %Gen-Z% <|im_end|>", + "template_4": "<|im_start|> %prompt% \n <|im_start|> %output% <|im_end|>", + "template_5": "<|im_start|> %instruction% \n <|im_start|> %output% <|im_end|>", + "template_6": "<|im_start|> %instruction%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_7": "<|im_start|> %question% \n <|im_start|> %output% <|im_end|>", + "template_8": "<|im_start|> %question% \n <|im_start|> %response% <|im_end|>", + "template_9": "<|im_start|> %perspective% \n <|im_start|> %output% <|im_end|>", + "template_10": "<|im_start|> %perspective%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_11": "<|im_start|> %instruction% \n <|im_start|> %toxic% <|im_end|>", + "template_12": "<|im_start|> %prompt% \n <|im_start|> %chosen% <|im_end|>", + "template_13": "<|im_start|> system\n : %system% \n <|im_end|> \n <|im_start|> %user% \n <|im_end|> \n <|im_start|> %assistant%" +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-3000/README.md b/BlackSheepVision-Phi-3/checkpoint-3000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8ea0943ce13efe0300134b4c76161d8a8ac77f36 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-3000/README.md @@ -0,0 +1,202 @@ +--- +base_model: models\microsoft_Phi-3-vision-128k-instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.12.0 \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-3000/adapter_config.json b/BlackSheepVision-Phi-3/checkpoint-3000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6db131c56e9e0a8676c747d1a38f41ab29779 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-3000/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "models\\microsoft_Phi-3-vision-128k-instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 4096, + "lora_dropout": 0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 2048, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "down_proj", + "k_proj", + "o_proj", + "up_proj", + "gate_proj", + "v_proj", + "q_proj" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-3000/adapter_model.safetensors b/BlackSheepVision-Phi-3/checkpoint-3000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a157b58211fec43929249364f480812acd27925b --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-3000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f506d681fc893c8d5306386ad1e56f5feaaf3eecbf94a3bf92c0a6d35a33a4 +size 5771408256 diff --git a/BlackSheepVision-Phi-3/checkpoint-3000/training_log.json b/BlackSheepVision-Phi-3/checkpoint-3000/training_log.json new file mode 100644 index 0000000000000000000000000000000000000000..f1ce202e07b0601416b981716e3074150d7030cb --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-3000/training_log.json @@ -0,0 +1,12 @@ +{ + "base_model_name": "microsoft_Phi-3-vision-128k-instruct", + "base_model_class": "Phi3VForCausalLM", + "base_loaded_in_4bit": true, + "base_loaded_in_8bit": false, + "projections": "gate, down, up, q, v, k, o", + "loss": 0.5155, + "grad_norm": 1.1744245290756226, + "learning_rate": 9.660527388881338e-05, + "epoch": 1.4272121788772598, + "current_steps": 2999 +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-3000/training_prompt.json b/BlackSheepVision-Phi-3/checkpoint-3000/training_prompt.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f85b67d7b4c4c05d0bcf5e2f16b6a1eb01d5c6 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-3000/training_prompt.json @@ -0,0 +1,16 @@ +{ + "template_type": "dataset", + "template_1": "Who is your creator?\n\n%creator%", + "template_2": "%ChatML_CONVO%", + "template_3": "<|im_start|> I want you to say this next statement like a Gen-Z. \n %English% \n <|im_start|> %Gen-Z% <|im_end|>", + "template_4": "<|im_start|> %prompt% \n <|im_start|> %output% <|im_end|>", + "template_5": "<|im_start|> %instruction% \n <|im_start|> %output% <|im_end|>", + "template_6": "<|im_start|> %instruction%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_7": "<|im_start|> %question% \n <|im_start|> %output% <|im_end|>", + "template_8": "<|im_start|> %question% \n <|im_start|> %response% <|im_end|>", + "template_9": "<|im_start|> %perspective% \n <|im_start|> %output% <|im_end|>", + "template_10": "<|im_start|> %perspective%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_11": "<|im_start|> %instruction% \n <|im_start|> %toxic% <|im_end|>", + "template_12": "<|im_start|> %prompt% \n <|im_start|> %chosen% <|im_end|>", + "template_13": "<|im_start|> system\n : %system% \n <|im_end|> \n <|im_start|> %user% \n <|im_end|> \n <|im_start|> %assistant%" +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-4000/README.md b/BlackSheepVision-Phi-3/checkpoint-4000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..8ea0943ce13efe0300134b4c76161d8a8ac77f36 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-4000/README.md @@ -0,0 +1,202 @@ +--- +base_model: models\microsoft_Phi-3-vision-128k-instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.12.0 \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-4000/adapter_config.json b/BlackSheepVision-Phi-3/checkpoint-4000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43d6db131c56e9e0a8676c747d1a38f41ab29779 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-4000/adapter_config.json @@ -0,0 +1,34 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "models\\microsoft_Phi-3-vision-128k-instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layer_replication": null, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 4096, + "lora_dropout": 0, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 2048, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "down_proj", + "k_proj", + "o_proj", + "up_proj", + "gate_proj", + "v_proj", + "q_proj" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-4000/adapter_model.safetensors b/BlackSheepVision-Phi-3/checkpoint-4000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c72fa6996d127a6cb3194da834a04fe26bd5de6a --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-4000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15d106bbc8ea868b631b6263e27c80d0d16bdf27ef70c23e92db1c5b07f35ae +size 5771408256 diff --git a/BlackSheepVision-Phi-3/checkpoint-4000/training_log.json b/BlackSheepVision-Phi-3/checkpoint-4000/training_log.json new file mode 100644 index 0000000000000000000000000000000000000000..fa6b37ba7b9ea0a924f523eac2464e1cf81da191 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-4000/training_log.json @@ -0,0 +1,12 @@ +{ + "base_model_name": "microsoft_Phi-3-vision-128k-instruct", + "base_model_class": "Phi3VForCausalLM", + "base_loaded_in_4bit": true, + "base_loaded_in_8bit": false, + "projections": "gate, down, up, q, v, k, o", + "loss": 0.649, + "grad_norm": 1.225587248802185, + "learning_rate": 9.547369851841784e-05, + "epoch": 1.9029495718363463, + "current_steps": 3999 +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/checkpoint-4000/training_prompt.json b/BlackSheepVision-Phi-3/checkpoint-4000/training_prompt.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f85b67d7b4c4c05d0bcf5e2f16b6a1eb01d5c6 --- /dev/null +++ b/BlackSheepVision-Phi-3/checkpoint-4000/training_prompt.json @@ -0,0 +1,16 @@ +{ + "template_type": "dataset", + "template_1": "Who is your creator?\n\n%creator%", + "template_2": "%ChatML_CONVO%", + "template_3": "<|im_start|> I want you to say this next statement like a Gen-Z. \n %English% \n <|im_start|> %Gen-Z% <|im_end|>", + "template_4": "<|im_start|> %prompt% \n <|im_start|> %output% <|im_end|>", + "template_5": "<|im_start|> %instruction% \n <|im_start|> %output% <|im_end|>", + "template_6": "<|im_start|> %instruction%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_7": "<|im_start|> %question% \n <|im_start|> %output% <|im_end|>", + "template_8": "<|im_start|> %question% \n <|im_start|> %response% <|im_end|>", + "template_9": "<|im_start|> %perspective% \n <|im_start|> %output% <|im_end|>", + "template_10": "<|im_start|> %perspective%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_11": "<|im_start|> %instruction% \n <|im_start|> %toxic% <|im_end|>", + "template_12": "<|im_start|> %prompt% \n <|im_start|> %chosen% <|im_end|>", + "template_13": "<|im_start|> system\n : %system% \n <|im_end|> \n <|im_start|> %user% \n <|im_end|> \n <|im_start|> %assistant%" +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/runs/Aug10_10-40-54_Troy-New-PC/events.out.tfevents.1723311654.Troy-New-PC.22016.0 b/BlackSheepVision-Phi-3/runs/Aug10_10-40-54_Troy-New-PC/events.out.tfevents.1723311654.Troy-New-PC.22016.0 new file mode 100644 index 0000000000000000000000000000000000000000..d61644c73bf6ce716986a5985a6741316347cb6c --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_10-40-54_Troy-New-PC/events.out.tfevents.1723311654.Troy-New-PC.22016.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099c012ba940bb7d2e790d86a7c955fc0f4ed8cb5245bdde209a7a29d5eb43c2 +size 63880 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-02-36_Troy-New-PC/events.out.tfevents.1723327356.Troy-New-PC.19660.0 b/BlackSheepVision-Phi-3/runs/Aug10_15-02-36_Troy-New-PC/events.out.tfevents.1723327356.Troy-New-PC.19660.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d51c431a9c3b28fa8e101f7a697cfdb17a6c777 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-02-36_Troy-New-PC/events.out.tfevents.1723327356.Troy-New-PC.19660.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c5a67d71062f0d9d8248bed764eed4575f8a7717b22b4899c55734fab5e4ff +size 6358 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-12-06_Troy-New-PC/events.out.tfevents.1723327926.Troy-New-PC.19660.1 b/BlackSheepVision-Phi-3/runs/Aug10_15-12-06_Troy-New-PC/events.out.tfevents.1723327926.Troy-New-PC.19660.1 new file mode 100644 index 0000000000000000000000000000000000000000..77cca5d95e467133b3e47657094aa9c77c4d2645 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-12-06_Troy-New-PC/events.out.tfevents.1723327926.Troy-New-PC.19660.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6f698f4c18c619fe51ffea7ba82fd68d3f9048c018bb98b633a84005a8c7e65 +size 6346 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-40-50_Troy-New-PC/events.out.tfevents.1723329650.Troy-New-PC.19660.2 b/BlackSheepVision-Phi-3/runs/Aug10_15-40-50_Troy-New-PC/events.out.tfevents.1723329650.Troy-New-PC.19660.2 new file mode 100644 index 0000000000000000000000000000000000000000..077bf427335b0495ad00d2b7385c3138c3ff0777 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-40-50_Troy-New-PC/events.out.tfevents.1723329650.Troy-New-PC.19660.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b7fc195da52fd1b181e23b725973caa6408e88358ac01d297dbed180655770 +size 6553 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-48-28_Troy-New-PC/events.out.tfevents.1723330108.Troy-New-PC.19660.3 b/BlackSheepVision-Phi-3/runs/Aug10_15-48-28_Troy-New-PC/events.out.tfevents.1723330108.Troy-New-PC.19660.3 new file mode 100644 index 0000000000000000000000000000000000000000..01c7b0176210fe1018a20eed4df529f63e914796 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-48-28_Troy-New-PC/events.out.tfevents.1723330108.Troy-New-PC.19660.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b83801e1c45219db42779330b54432ee8d0681a650926ebfa588ca25c82282 +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-50-50_Troy-New-PC/events.out.tfevents.1723330250.Troy-New-PC.26212.0 b/BlackSheepVision-Phi-3/runs/Aug10_15-50-50_Troy-New-PC/events.out.tfevents.1723330250.Troy-New-PC.26212.0 new file mode 100644 index 0000000000000000000000000000000000000000..d384540f5f30c34f949b23aa93b2879400ecf36b --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-50-50_Troy-New-PC/events.out.tfevents.1723330250.Troy-New-PC.26212.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c3a9fcb9a6c720b44f6f816bb4a04909fb8bc504a13030c034939e397cf5cc +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_15-54-59_Troy-New-PC/events.out.tfevents.1723330499.Troy-New-PC.24024.0 b/BlackSheepVision-Phi-3/runs/Aug10_15-54-59_Troy-New-PC/events.out.tfevents.1723330499.Troy-New-PC.24024.0 new file mode 100644 index 0000000000000000000000000000000000000000..269704b2ddfbb362c44524064a7e40ed15122aad --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_15-54-59_Troy-New-PC/events.out.tfevents.1723330499.Troy-New-PC.24024.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93bbca065ef1cc0131af9debb6b4bfaf94ef650e866fdbdc91c238b33c5f509 +size 8690 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_16-25-11_Troy-New-PC/events.out.tfevents.1723332311.Troy-New-PC.16236.0 b/BlackSheepVision-Phi-3/runs/Aug10_16-25-11_Troy-New-PC/events.out.tfevents.1723332311.Troy-New-PC.16236.0 new file mode 100644 index 0000000000000000000000000000000000000000..667ffe1093f506048edee57934ead9354d3a7645 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_16-25-11_Troy-New-PC/events.out.tfevents.1723332311.Troy-New-PC.16236.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bb3163f967d46380f3cf70d0ffbf0cbcdcc3b15caefce9de3581082d72f4308 +size 5933 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_16-32-57_Troy-New-PC/events.out.tfevents.1723332777.Troy-New-PC.16236.1 b/BlackSheepVision-Phi-3/runs/Aug10_16-32-57_Troy-New-PC/events.out.tfevents.1723332777.Troy-New-PC.16236.1 new file mode 100644 index 0000000000000000000000000000000000000000..fddbd8f25c2f517b4f9a16fb5041e651e6716842 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_16-32-57_Troy-New-PC/events.out.tfevents.1723332777.Troy-New-PC.16236.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a3254dc1542ea44995a2daf31ee1880d12b0c5c2d1f891af3c020f71ca8a8c +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_16-35-16_Troy-New-PC/events.out.tfevents.1723332916.Troy-New-PC.15040.0 b/BlackSheepVision-Phi-3/runs/Aug10_16-35-16_Troy-New-PC/events.out.tfevents.1723332916.Troy-New-PC.15040.0 new file mode 100644 index 0000000000000000000000000000000000000000..f8bd6c695117b7956b5d4be96c659a199b66393b --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_16-35-16_Troy-New-PC/events.out.tfevents.1723332916.Troy-New-PC.15040.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41985da8e645d226d39d9c81a1f57231a6adde20bf2a3bb8a51c45bfb15d3d2e +size 12595 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_17-21-18_Troy-New-PC/events.out.tfevents.1723335678.Troy-New-PC.9632.0 b/BlackSheepVision-Phi-3/runs/Aug10_17-21-18_Troy-New-PC/events.out.tfevents.1723335678.Troy-New-PC.9632.0 new file mode 100644 index 0000000000000000000000000000000000000000..2a264e2e9c275254fe094bef1eff1f481e6ada77 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_17-21-18_Troy-New-PC/events.out.tfevents.1723335678.Troy-New-PC.9632.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31a5d9db85b4c9a8dd5544d62f229a0ea141b5147ad3c3f95163d56ca894750 +size 47832 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_17-56-02_Troy-New-PC/events.out.tfevents.1723337762.Troy-New-PC.22188.0 b/BlackSheepVision-Phi-3/runs/Aug10_17-56-02_Troy-New-PC/events.out.tfevents.1723337762.Troy-New-PC.22188.0 new file mode 100644 index 0000000000000000000000000000000000000000..3024738c28eb5bfa97f0fb3452a582d403f74440 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_17-56-02_Troy-New-PC/events.out.tfevents.1723337762.Troy-New-PC.22188.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d758a24bd567853a3c50507f4b9b7468e946049103f268547b3f2dcfeb9fc815 +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_17-57-40_Troy-New-PC/events.out.tfevents.1723337860.Troy-New-PC.15172.0 b/BlackSheepVision-Phi-3/runs/Aug10_17-57-40_Troy-New-PC/events.out.tfevents.1723337860.Troy-New-PC.15172.0 new file mode 100644 index 0000000000000000000000000000000000000000..6cfc8879a7809438cb0d71533dcb6299da0ea0ba --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_17-57-40_Troy-New-PC/events.out.tfevents.1723337860.Troy-New-PC.15172.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e326817cb78581d8b21921f8c1b3a9d56bb69bcde8aa5de9c5af59abe3148637 +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_17-58-53_Troy-New-PC/events.out.tfevents.1723337933.Troy-New-PC.22412.0 b/BlackSheepVision-Phi-3/runs/Aug10_17-58-53_Troy-New-PC/events.out.tfevents.1723337933.Troy-New-PC.22412.0 new file mode 100644 index 0000000000000000000000000000000000000000..e0ac0e697fcc4d794157a09ea381df91b81d3e19 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_17-58-53_Troy-New-PC/events.out.tfevents.1723337933.Troy-New-PC.22412.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de0e5d9d0b68ab9d41aa1e969c132bf1cb161ce63f3171384593af197b62daf +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_18-00-16_Troy-New-PC/events.out.tfevents.1723338016.Troy-New-PC.9200.0 b/BlackSheepVision-Phi-3/runs/Aug10_18-00-16_Troy-New-PC/events.out.tfevents.1723338016.Troy-New-PC.9200.0 new file mode 100644 index 0000000000000000000000000000000000000000..6b906d20a35dfc378ca9a26e142dd90250e1e1c8 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_18-00-16_Troy-New-PC/events.out.tfevents.1723338016.Troy-New-PC.9200.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bf93777958ccae26cfd15308e5c6b763f860b3bdfe2597759947396a358a32 +size 36438 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_21-03-19_Troy-New-PC/events.out.tfevents.1723349000.Troy-New-PC.9200.1 b/BlackSheepVision-Phi-3/runs/Aug10_21-03-19_Troy-New-PC/events.out.tfevents.1723349000.Troy-New-PC.9200.1 new file mode 100644 index 0000000000000000000000000000000000000000..7a9a939ccb9d9b5d105fdb8e883c2401cae1dc4a --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_21-03-19_Troy-New-PC/events.out.tfevents.1723349000.Troy-New-PC.9200.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34dcd9366d7dd19c3805392402914b8f52fd7cc6281a2dd832b5e5c21b705ca9 +size 5378 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_21-10-34_Troy-New-PC/events.out.tfevents.1723349435.Troy-New-PC.8440.0 b/BlackSheepVision-Phi-3/runs/Aug10_21-10-34_Troy-New-PC/events.out.tfevents.1723349435.Troy-New-PC.8440.0 new file mode 100644 index 0000000000000000000000000000000000000000..ee228a22c7b8e885cfc98dbb8db4be4aa362d5d4 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_21-10-34_Troy-New-PC/events.out.tfevents.1723349435.Troy-New-PC.8440.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6abf58b49a5c23030c57f3910b52f41f82e05415f7bbd0e6798628a6a5aa5fa +size 5933 diff --git a/BlackSheepVision-Phi-3/runs/Aug10_21-14-10_Troy-New-PC/events.out.tfevents.1723349650.Troy-New-PC.8440.1 b/BlackSheepVision-Phi-3/runs/Aug10_21-14-10_Troy-New-PC/events.out.tfevents.1723349650.Troy-New-PC.8440.1 new file mode 100644 index 0000000000000000000000000000000000000000..22d9ae83c853bb9bc3bd11f5310c220783f1d216 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug10_21-14-10_Troy-New-PC/events.out.tfevents.1723349650.Troy-New-PC.8440.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb457e4e01809c81f204571868046ae827686fc28e0d25ecb21482f47c89dddb +size 171478 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_07-57-56_Troy-New-PC/events.out.tfevents.1723388276.Troy-New-PC.8440.2 b/BlackSheepVision-Phi-3/runs/Aug11_07-57-56_Troy-New-PC/events.out.tfevents.1723388276.Troy-New-PC.8440.2 new file mode 100644 index 0000000000000000000000000000000000000000..6cbd843d4d8b9cc222b6575032d30e6cc8f4a8a9 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_07-57-56_Troy-New-PC/events.out.tfevents.1723388276.Troy-New-PC.8440.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d8b2b45072fe1a703ecaf7165db2c4e786352c86227eae55da8d560945a779 +size 25677 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_09-22-10_Troy-New-PC/events.out.tfevents.1723393331.Troy-New-PC.8440.3 b/BlackSheepVision-Phi-3/runs/Aug11_09-22-10_Troy-New-PC/events.out.tfevents.1723393331.Troy-New-PC.8440.3 new file mode 100644 index 0000000000000000000000000000000000000000..1880669bf30f2ce59fd556a333b675cd5c8234ba --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_09-22-10_Troy-New-PC/events.out.tfevents.1723393331.Troy-New-PC.8440.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a24b3234092e7cdb7890f921e535ef333b3a0998b6233a53f43c0fddab1238 +size 64025 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-11-33_Troy-New-PC/events.out.tfevents.1723396293.Troy-New-PC.3004.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-11-33_Troy-New-PC/events.out.tfevents.1723396293.Troy-New-PC.3004.0 new file mode 100644 index 0000000000000000000000000000000000000000..ce035e064f1ef733e83db838446676baba025e59 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-11-33_Troy-New-PC/events.out.tfevents.1723396293.Troy-New-PC.3004.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb53c22488cf45e8761d87b1ab893cd32045ef70188eefe73902ab189e8cccf8 +size 8422 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-13-19_Troy-New-PC/events.out.tfevents.1723396399.Troy-New-PC.5380.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-13-19_Troy-New-PC/events.out.tfevents.1723396399.Troy-New-PC.5380.0 new file mode 100644 index 0000000000000000000000000000000000000000..8a1a1041346e3cb2a1f6ee944d8f8c0bf9088180 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-13-19_Troy-New-PC/events.out.tfevents.1723396399.Troy-New-PC.5380.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eec9410902a0ba3e90218a30d0f3cf9bbe66d37df319ca2f5d175320ce1c88c +size 8423 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-14-32_Troy-New-PC/events.out.tfevents.1723396473.Troy-New-PC.9536.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-14-32_Troy-New-PC/events.out.tfevents.1723396473.Troy-New-PC.9536.0 new file mode 100644 index 0000000000000000000000000000000000000000..944510fca0203dc06b3058f2c51120dbc6eaf52f --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-14-32_Troy-New-PC/events.out.tfevents.1723396473.Troy-New-PC.9536.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff3401af62daff04da24364673f03a58c8f834d480f126e76e06ae570b6d75e4 +size 8423 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-15-46_Troy-New-PC/events.out.tfevents.1723396546.Troy-New-PC.21572.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-15-46_Troy-New-PC/events.out.tfevents.1723396546.Troy-New-PC.21572.0 new file mode 100644 index 0000000000000000000000000000000000000000..402e3d21aa3c1618a4bcd71a80c8f00f9beb8fe0 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-15-46_Troy-New-PC/events.out.tfevents.1723396546.Troy-New-PC.21572.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c645d3e65856f03feb6baf4b1856c99c0c1109720f6408017f8a77a83cbd95e +size 8423 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-18-58_Troy-New-PC/events.out.tfevents.1723396738.Troy-New-PC.12708.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-18-58_Troy-New-PC/events.out.tfevents.1723396738.Troy-New-PC.12708.0 new file mode 100644 index 0000000000000000000000000000000000000000..e4420da112a7e4e4656134261796d717c0d71428 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-18-58_Troy-New-PC/events.out.tfevents.1723396738.Troy-New-PC.12708.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db83d9102cb1cca251756088221070b64cef098dcd44f3fb0ba15cdeba546b5 +size 8423 diff --git a/BlackSheepVision-Phi-3/runs/Aug11_10-22-18_Troy-New-PC/events.out.tfevents.1723396938.Troy-New-PC.13048.0 b/BlackSheepVision-Phi-3/runs/Aug11_10-22-18_Troy-New-PC/events.out.tfevents.1723396938.Troy-New-PC.13048.0 new file mode 100644 index 0000000000000000000000000000000000000000..cee35a24ddbe25ce71ec20db065c809a58df8669 --- /dev/null +++ b/BlackSheepVision-Phi-3/runs/Aug11_10-22-18_Troy-New-PC/events.out.tfevents.1723396938.Troy-New-PC.13048.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cd51958843cce9335c9b7e6a5612d887b8b830cb37500d52a5234d5b5c0cef +size 113333 diff --git a/BlackSheepVision-Phi-3/training_log.json b/BlackSheepVision-Phi-3/training_log.json new file mode 100644 index 0000000000000000000000000000000000000000..18a73d16498a6b4b9ea86466d20b7eaa2798c91e --- /dev/null +++ b/BlackSheepVision-Phi-3/training_log.json @@ -0,0 +1,17 @@ +{ + "base_model_name": "microsoft_Phi-3-vision-128k-instruct", + "base_model_class": "Phi3VForCausalLM", + "base_loaded_in_4bit": true, + "base_loaded_in_8bit": false, + "projections": "gate, down, up, q, v, k, o", + "loss": 0.3423, + "grad_norm": 1.8447479009628296, + "learning_rate": 9.438738616283812e-05, + "epoch": 2.3596574690770695, + "current_steps": 4961, + "train_runtime": 14910.6647, + "train_samples_per_second": 5.921, + "train_steps_per_second": 2.96, + "total_flos": 6.693944118843802e+17, + "train_loss": 0.7060681312735523 +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/training_parameters.json b/BlackSheepVision-Phi-3/training_parameters.json new file mode 100644 index 0000000000000000000000000000000000000000..c6a3c3476da0af2a8cd9f7a9215674ac014efb7c --- /dev/null +++ b/BlackSheepVision-Phi-3/training_parameters.json @@ -0,0 +1,37 @@ +{ + "lora_name": "Nemo", + "always_override": true, + "q_proj_en": true, + "v_proj_en": true, + "k_proj_en": true, + "o_proj_en": true, + "gate_proj_en": true, + "down_proj_en": true, + "up_proj_en": true, + "save_steps": 1000, + "micro_batch_size": 1, + "batch_size": 2, + "epochs": 42, + "learning_rate": "1e-4", + "lr_scheduler_type": "polynomial", + "lora_rank": 2048, + "lora_alpha": 4096, + "lora_dropout": 0, + "cutoff_len": 4096, + "dataset": "BLACKSHEEP-Toxic_Assistant", + "eval_dataset": "None", + "format": "unwoke_alpaca-chatbot-format", + "eval_steps": 100, + "raw_text_file": "None", + "overlap_len": 512, + "newline_favor_len": 512, + "higher_rank_limit": true, + "warmup_steps": 0, + "optimizer": "adamw_bnb_8bit", + "hard_cut_string": "\\n\\n\\n", + "train_only_after": "", + "stop_at_loss": 0, + "add_eos_token": false, + "min_chars": 0, + "report_to": "tensorboard" +} \ No newline at end of file diff --git a/BlackSheepVision-Phi-3/training_prompt.json b/BlackSheepVision-Phi-3/training_prompt.json new file mode 100644 index 0000000000000000000000000000000000000000..f8f85b67d7b4c4c05d0bcf5e2f16b6a1eb01d5c6 --- /dev/null +++ b/BlackSheepVision-Phi-3/training_prompt.json @@ -0,0 +1,16 @@ +{ + "template_type": "dataset", + "template_1": "Who is your creator?\n\n%creator%", + "template_2": "%ChatML_CONVO%", + "template_3": "<|im_start|> I want you to say this next statement like a Gen-Z. \n %English% \n <|im_start|> %Gen-Z% <|im_end|>", + "template_4": "<|im_start|> %prompt% \n <|im_start|> %output% <|im_end|>", + "template_5": "<|im_start|> %instruction% \n <|im_start|> %output% <|im_end|>", + "template_6": "<|im_start|> %instruction%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_7": "<|im_start|> %question% \n <|im_start|> %output% <|im_end|>", + "template_8": "<|im_start|> %question% \n <|im_start|> %response% <|im_end|>", + "template_9": "<|im_start|> %perspective% \n <|im_start|> %output% <|im_end|>", + "template_10": "<|im_start|> %perspective%\n %input%\n <|im_start|> %output% <|im_end|>", + "template_11": "<|im_start|> %instruction% \n <|im_start|> %toxic% <|im_end|>", + "template_12": "<|im_start|> %prompt% \n <|im_start|> %chosen% <|im_end|>", + "template_13": "<|im_start|> system\n : %system% \n <|im_end|> \n <|im_start|> %user% \n <|im_end|> \n <|im_start|> %assistant%" +} \ No newline at end of file