Skip to content

Commit

Permalink
Merge branch 'main' of https://github.com/openvpi/SOME
Browse files Browse the repository at this point in the history
  • Loading branch information
yqzhishen committed Sep 20, 2023
2 parents 0befadd + de973eb commit 7c89acd
Show file tree
Hide file tree
Showing 7 changed files with 766 additions and 4 deletions.
1 change: 1 addition & 0 deletions configs/base.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -28,6 +28,7 @@ units_dim: 80 # 768
midi_num_bins: 128
model_cls: null
midi_extractor_args: {}
use_BCEWithLogitsLoss: false

# training
use_midi_loss: true
Expand Down
37 changes: 37 additions & 0 deletions configs/midi_conformer.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# Training configuration for the conformer-based MIDI extraction model.
# Inherits from the files listed in base_config (presumably keys set here
# override the inherited values -- confirm against the config loader).
base_config:
  - configs/base.yaml

# Dotted import paths of the model class and the training task class.
model_cls: modules.model.Gmidi_conform.midi_conforms
task_cls: training.MIDIExtractionTask
binary_data_dir: data/some_ds_roundmidi_spk3_aug8/binary

# Logging, validation and checkpointing schedule.
num_valid_plots: 100
log_interval: 100
num_sanity_val_steps: 1  # steps of validation at the beginning
val_check_interval: 5000
num_ckpt_keep: 6
max_updates: 300000

midi_prob_deviation: 1.0
midi_shift_proportion: 0.0
midi_shift_range: [-12, 12]
rest_threshold: 0.1

use_BCEWithLogitsLoss: true

# Model hyperparameters (presumably forwarded to model_cls -- confirm).
# These keys must be indented under midi_extractor_args: a bare
# `midi_extractor_args:` with nothing nested parses as null and would leave
# the keys below as unrelated top-level settings.
midi_extractor_args:
  lay: 8
  dim: 512
  use_lay_skip: true
  kernel_size: 31
  conv_drop: 0.1
  ffn_latent_drop: 0.1
  ffn_out_drop: 0.1
  attention_drop: 0.1
  attention_heads: 8
  attention_heads_dim: 64
  # NOTE(review): presumably disables an in-model sigmoid because
  # use_BCEWithLogitsLoss expects raw logits -- confirm.
  sig: false

# Quoted so the value is always read as a string.
pl_trainer_precision: 'bf16'
39 changes: 39 additions & 0 deletions configs/unet.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,39 @@
# Training configuration for the U-Net conformer MIDI extraction model.
# Inherits from the files listed in base_config (presumably keys set here
# override the inherited values -- confirm against the config loader).
base_config:
  - configs/base.yaml

max_batch_size: 1
# Dotted import paths of the model class and the training task class.
model_cls: modules.model.unet_conform.midi_unet_conforms
task_cls: training.MIDIExtractionTask
binary_data_dir: data/some_ds_roundmidi_spk3_aug8/binary

# Logging, validation and checkpointing schedule.
num_valid_plots: 100
log_interval: 100
num_sanity_val_steps: 1  # steps of validation at the beginning
val_check_interval: 5000
num_ckpt_keep: 6
max_updates: 100000

midi_prob_deviation: 1.0
midi_shift_proportion: 0.0
midi_shift_range: [-12, 12]
rest_threshold: 0.1

use_BCEWithLogitsLoss: true

# Model hyperparameters (presumably forwarded to model_cls -- confirm).
# These keys must be indented under midi_extractor_args: a bare
# `midi_extractor_args:` with nothing nested parses as null and would leave
# the keys below as unrelated top-level settings.
midi_extractor_args:
  output_lay: 3
  dim: 512
  kernel_size: 31
  conv_drop: 0.1
  ffn_latent_drop: 0.1
  ffn_out_drop: 0.1
  attention_drop: 0.1
  attention_heads: 4
  attention_heads_dim: 64
  unet_type: 'cf_unet_full'
  # unet_down and unet_dim both list five entries
  # (presumably one per U-Net stage -- confirm).
  unet_down: [2, 2, 2, 2, 2]
  unet_dim: [512, 512, 768, 768, 1024]
  unet_latentdim: 1024
  # NOTE(review): presumably disables an in-model sigmoid because
  # use_BCEWithLogitsLoss expects raw logits -- confirm.
  sig: false

# Quoted so the value is always read as a string.
pl_trainer_precision: 'bf16'
Loading

0 comments on commit 7c89acd

Please sign in to comment.