pavan-naik committed on
Commit
8de4dca
·
verified ·
1 Parent(s): 7caf528

Upload prediction_artifacts/training_args.yaml with huggingface_hub

Browse files
prediction_artifacts/training_args.yaml ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ cutoff_len: 1024
2
+ dataset_dir: data
3
+ do_predict: true
4
+ eval_dataset: english_to_kannada_test
5
+ finetuning_type: lora
6
+ flash_attn: auto
7
+ max_new_tokens: 512
8
+ max_samples: 100000
9
+ model_name_or_path: /content/gemma_3_1b_it_kn_ext_init
10
+ output_dir: saves/Gemma-3-1B-Instruct/lora/gemma_3_1b_it_kn_ext_init
11
+ per_device_eval_batch_size: 16
12
+ predict_with_generate: true
13
+ preprocessing_num_workers: 16
14
+ quantization_method: bnb
15
+ stage: sft
16
+ temperature: 0.95
17
+ template: gemma
18
+ top_p: 0.7
19
+ trust_remote_code: true