| ############################################################################## | |
| # THIS FILE IS ONLY MEANT TO BE EDITED IF YOU ARE SURE! | |
| # PROGRAM FAILURE IS LIKELY TO OCCUR IF YOU ARE UNSURE OF THE | |
| # CONSEQUENCES OF YOUR CHANGES. | |
| # IF YOU HAVE CHANGED VALUES AND ARE ENCOUNTERING ERRORS, | |
| # STASH YOUR CHANGES ('git stash' in a git bash console in acodet directory) | |
| ############################################################################## | |
| #################### AUDIO PROCESSING PARAMETERS ########################### | |
| #!!! CHANGING THESE PARAMETERS WILL RESULT IN MODEL FAILURE, ONLY TO !!!# | |
| #!!! BE CHANGED FOR TRAINING OF NEW MODEL ESPECIALY FOR DIFFERENT SPECIES !!!# | |
| ## Global audio processing parameters | |
| # sample rate | |
| sample_rate: 2000 | |
| # length of context window in seconds | |
| # this is the audio segment length that the model is trained on | |
| context_window_in_seconds: 3.9 | |
| ## Mel-Spectrogram parameters | |
| # FFT window length | |
| stft_frame_len: 1024 | |
| # number of time bins for mel spectrogram | |
| number_of_time_bins: 128 | |
| ################### TFRECORD CREATION PARAMETERS ########################### | |
| ## Settings for Creation of Tfrecord Dataset | |
| # limit of context windows in a tfrecords file | |
| tfrecs_limit_per_file: 600 | |
| # train/test split | |
| train_ratio: 0.7 | |
| # test/val split | |
| test_val_ratio: 0.7 | |
| ######################## ANNOTATIONS ######################################## | |
| default_threshold: 0.5 | |
| # minimum frequency of annotation boxes | |
| annotation_df_fmin: 50 | |
| # maximum frequency of annotation boxes | |
| annotation_df_fmax: 1000 | |
| ######################## PATHS ############################################# | |
| # dataset destination directory - save tfrecord dataset to this directory | |
| # only change when really necessary | |
| tfrecords_destination_folder: 'tests/test-tfrec' | |
| # default folder to store newly created annotations | |
| generated_annotations_folder: '../generated_annotations' | |
| # name of current North Atlantic humpback whale song model | |
| model_name: 'Humpback_20221130' | |
| # name of top level directory when annotating multiple datasets | |
| top_dir_name: 'main' | |
| # custom string to add to timestamp for directory name | |
| # of created annotations | |
| annots_timestamp_folder: '' | |
| # default threshold folder name | |
| thresh_label: 'thresh_0.5' | |
| ####################### TRAINING ########################################### | |
| # Name of Model class, default is HumpBackNorthAtlantic, possible other classes | |
| # are GoogleMod for the modified ResNet-50 architecture, or KerasAppModel for | |
| # any of the Keras application models (name will get specified under keras_mod_name) | |
| ModelClassName: 'HumpBackNorthAtlantic' | |
| # batch size for training and evaluating purposes | |
| batch_size: 32 | |
| # number of epochs to run the model | |
| epochs: 50 | |
| # specify the path to your training checkpoint here to load a pretrained model | |
| load_ckpt_path: False | |
| # to run the google model, select True | |
| load_g_ckpt: False | |
| # specify the name of the keras application model that you want to run - select the | |
| # ModelClassName KerasAppModel for this | |
| keras_mod_name: False | |
| # number of steps per epoch | |
| steps_per_epoch: 1000 | |
| # select True if you want your training data to be time shift augmented (recommended) | |
| time_augs: True | |
| # select True if you want your training data to be MixUp augmented (recommended) | |
| mixup_augs: True | |
| # select True if you want your training data to be | |
| # time and frequency masked augmented (recommended) | |
| spec_aug: True | |
| # specify a string to describe the dataset used for this model run (to later be able | |
| # to understand what was significant about this model training) | |
| data_description: 'describe your dataset' | |
| # starting learning rate | |
| init_lr: 5e-4 | |
| # final learning rate | |
| final_lr: 5e-6 | |
| # number of preliminary blocks in model (are kept frozen) | |
| pre_blocks: 9 | |
| # threshold for f score beta | |
| f_score_beta: 0.5 | |
| f_score_thresh: 0.5 | |
| # number of layers to unfreeze, if False, the entire model is trainable | |
| unfreeze: False | |
| ######################## Streamlit ######################################### | |
| # select True if you want to run the streamlit app | |
| streamlit: False |