Tiger14n committed on
Commit
19ce837
·
verified ·
1 Parent(s): 7ef7abb

Update configs/inference.yaml

Browse files
Files changed (1) hide show
  1. configs/inference.yaml +64 -64
configs/inference.yaml CHANGED
@@ -1,65 +1,65 @@
1
- model:
2
- name: 'google/t5-v1_1-small'
3
- spectrogram:
4
- sample_rate: 16000
5
- hop_length: 128
6
- n_fft: 1024
7
- n_mels: 388
8
- do_style_embed: false
9
- input_features: false
10
-
11
- model_path: './checkpoint'
12
- audio_path: '' # Path to input audio
13
- total_duration_ms: 0 # Total duration of audio in milliseconds, 0 for full audio
14
- output_path: '' # Path to output directory
15
- bpm: 120 # Beats per minute of input audio
16
- offset: 0 # Start of beat, in milliseconds, from the beginning of input audio
17
- resnap_objects: false # Resnap objects to beat timing ticks; requires accurate BPM and offset
18
- slider_multiplier: 1.7 # Multiplier for slider velocity
19
- title: '' # Song title
20
- artist: '' # Song artist
21
- beatmap_path: '' # Path to .osu file which will be remapped
22
- other_beatmap_path: '' # Path to .osu file of other beatmap in the mapset to use as reference
23
- beatmap_id: -1 # Beatmap ID to use as style
24
- difficulty: -1 # Difficulty star rating to map
25
- creator: '' # Beatmap creator
26
- version: '' # Beatmap version
27
- full_set: true # Generate full mapset
28
- set_difficulties: 5 # Number of difficulties to generate.
29
-
30
- # Diffusion settings
31
- generate_positions: true # Use diffusion to generate object positions
32
- diff_ckpt: './osudiffusion/DiT-B-0700000.pt' # Path to checkpoint for diffusion model
33
- diff_refine_ckpt: '' # Path to checkpoint for refining diffusion model
34
-
35
- diffusion:
36
- style_id: 1451282 # Style ID to use for diffusion
37
- num_sampling_steps: 100 # Number of sampling steps
38
- cfg_scale: 1 # Scale of classifier-free guidance
39
- num_classes: 52670 # Number of classes stored in the model
40
- beatmap_idx: 'osudiffusion/beatmap_idx.pickle' # Path to beatmap index
41
- use_amp: true # Use automatic mixed precision
42
- refine_iters: 10 # Number of refinement iterations
43
- seq_len: 128 # Sequence length
44
- model: 'DiT-B' # Model architecture
45
-
46
-
47
- data: # Data settings
48
- src_seq_len: 640
49
- tgt_seq_len: 480
50
- sample_rate: ${model.spectrogram.sample_rate}
51
- hop_length: ${model.spectrogram.hop_length}
52
- sequence_stride: 1 # Fraction of audio sequence length to shift inference window
53
- center_pad_decoder: false # Center pad decoder input
54
- add_pre_tokens: true
55
- special_token_len: 2
56
- diff_token_index: 0
57
- style_token_index: -1
58
- max_pre_token_len: 4
59
- add_gd_context: false # Prefix the decoder with tokens of another beatmap in the mapset
60
-
61
- hydra:
62
- job:
63
- chdir: False
64
- run:
65
  dir: ./logs/${now:%Y-%m-%d}/${now:%H-%M-%S}
 
1
+ model:
2
+ name: 'google/t5-v1_1-small'
3
+ spectrogram:
4
+ sample_rate: 16000
5
+ hop_length: 128
6
+ n_fft: 1024
7
+ n_mels: 256
8
+ do_style_embed: false
9
+ input_features: false
10
+
11
+ model_path: './checkpoint'
12
+ audio_path: '' # Path to input audio
13
+ total_duration_ms: 0 # Total duration of audio in milliseconds, 0 for full audio
14
+ output_path: '' # Path to output directory
15
+ bpm: 120 # Beats per minute of input audio
16
+ offset: 0 # Start of beat, in milliseconds, from the beginning of input audio
17
+ resnap_objects: false # Resnap objects to beat timing ticks; requires accurate BPM and offset
18
+ slider_multiplier: 1.7 # Multiplier for slider velocity
19
+ title: '' # Song title
20
+ artist: '' # Song artist
21
+ beatmap_path: '' # Path to .osu file which will be remapped
22
+ other_beatmap_path: '' # Path to .osu file of other beatmap in the mapset to use as reference
23
+ beatmap_id: -1 # Beatmap ID to use as style
24
+ difficulty: -1 # Difficulty star rating to map
25
+ creator: '' # Beatmap creator
26
+ version: '' # Beatmap version
27
+ full_set: false # Generate full mapset
28
+ set_difficulties: 5 # Number of difficulties to generate.
29
+
30
+ # Diffusion settings
31
+ generate_positions: true # Use diffusion to generate object positions
32
+ diff_ckpt: './osudiffusion/DiT-B-0700000.pt' # Path to checkpoint for diffusion model
33
+ diff_refine_ckpt: '' # Path to checkpoint for refining diffusion model
34
+
35
+ diffusion:
36
+ style_id: 1451282 # Style ID to use for diffusion
37
+ num_sampling_steps: 100 # Number of sampling steps
38
+ cfg_scale: 1 # Scale of classifier-free guidance
39
+ num_classes: 52670 # Number of classes stored in the model
40
+ beatmap_idx: 'osudiffusion/beatmap_idx.pickle' # Path to beatmap index
41
+ use_amp: true # Use automatic mixed precision
42
+ refine_iters: 10 # Number of refinement iterations
43
+ seq_len: 128 # Sequence length
44
+ model: 'DiT-B' # Model architecture
45
+
46
+
47
+ data: # Data settings
48
+ src_seq_len: 800
49
+ tgt_seq_len: 600
50
+ sample_rate: ${model.spectrogram.sample_rate}
51
+ hop_length: ${model.spectrogram.hop_length}
52
+ sequence_stride: 1 # Fraction of audio sequence length to shift inference window
53
+ center_pad_decoder: false # Center pad decoder input
54
+ add_pre_tokens: true
55
+ special_token_len: 2
56
+ diff_token_index: 0
57
+ style_token_index: -1
58
+ max_pre_token_len: 4
59
+ add_gd_context: false # Prefix the decoder with tokens of another beatmap in the mapset
60
+
61
+ hydra:
62
+ job:
63
+ chdir: False
64
+ run:
65
  dir: ./logs/${now:%Y-%m-%d}/${now:%H-%M-%S}