Upload prediction_artifacts/training_args.yaml with huggingface_hub
Browse files
prediction_artifacts/training_args.yaml
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
cutoff_len: 1024
|
| 2 |
+
dataset_dir: data
|
| 3 |
+
do_predict: true
|
| 4 |
+
eval_dataset: english_to_kannada_test
|
| 5 |
+
finetuning_type: lora
|
| 6 |
+
flash_attn: auto
|
| 7 |
+
max_new_tokens: 512
|
| 8 |
+
max_samples: 100000
|
| 9 |
+
model_name_or_path: /content/gemma_3_1b_it_kn_ext_init
|
| 10 |
+
output_dir: saves/Gemma-3-1B-Instruct/lora/gemma_3_1b_it_kn_ext_init
|
| 11 |
+
per_device_eval_batch_size: 16
|
| 12 |
+
predict_with_generate: true
|
| 13 |
+
preprocessing_num_workers: 16
|
| 14 |
+
quantization_method: bnb
|
| 15 |
+
stage: sft
|
| 16 |
+
temperature: 0.95
|
| 17 |
+
template: gemma
|
| 18 |
+
top_p: 0.7
|
| 19 |
+
trust_remote_code: true
|