kacper committed on
Commit
01b6887
1 Parent(s): e2d4861

Initial model version

Browse files
Files changed (3) hide show
  1. README.md +14 -0
  2. config.yaml +132 -0
  3. percussion_v0-finetuned-triton.ckpt +3 -0
README.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - audio
4
+ - diffusion
5
+ - waveform diffusion
6
+ - audio diffusion
7
+ - unet
8
+ - korg
9
+ - triton
10
+ - grime
11
+ ---
12
+ # Model Card for tiny-audio-diffusion-percussion
13
+
14
+ General percussion/drum model for tiny-audio-diffusion, fine-tuned for 56 epochs on a dataset of 382 Korg Triton drum samples. Use it with the [tiny-audio-diffusion](https://github.com/crlandsc/tiny-audio-diffusion) repo to generate random drum samples of all types.
config.yaml ADDED
@@ -0,0 +1,132 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 12345
2
+ train: true
3
+ ignore_warnings: true
4
+ print_config: false
5
+ work_dir: ${hydra:runtime.cwd}
6
+ logs_dir: ${work_dir}${oc.env:DIR_LOGS}
7
+ data_dir: ${work_dir}${oc.env:DIR_DATA}
8
+ ckpt_dir: ${logs_dir}/runs/${now:%Y-%m-%d-%H-%M-%S}
9
+ module: main.module_base
10
+ batch_size: 16
11
+ accumulate_grad_batches: 2
12
+ num_workers: 16
13
+ sampling_rate: 44100
14
+ length: 32768
15
+ channels: 2
16
+ log_every_n_steps: 500
17
+ model:
18
+ _target_: ${module}.Model
19
+ lr: 0.0001
20
+ lr_beta1: 0.95
21
+ lr_beta2: 0.999
22
+ lr_eps: 1.0e-06
23
+ lr_weight_decay: 0.001
24
+ ema_beta: 0.995
25
+ ema_power: 0.7
26
+ model:
27
+ _target_: main.DiffusionModel
28
+ net_t:
29
+ _target_: ${module}.UNetT
30
+ in_channels: 2
31
+ channels:
32
+ - 32
33
+ - 32
34
+ - 64
35
+ - 64
36
+ - 128
37
+ - 128
38
+ - 256
39
+ - 256
40
+ factors:
41
+ - 1
42
+ - 2
43
+ - 2
44
+ - 2
45
+ - 2
46
+ - 2
47
+ - 2
48
+ - 2
49
+ items:
50
+ - 2
51
+ - 2
52
+ - 2
53
+ - 2
54
+ - 2
55
+ - 2
56
+ - 4
57
+ - 4
58
+ attentions:
59
+ - 0
60
+ - 0
61
+ - 0
62
+ - 0
63
+ - 0
64
+ - 1
65
+ - 1
66
+ - 1
67
+ attention_heads: 8
68
+ attention_features: 64
69
+ datamodule:
70
+ _target_: main.module_base.Datamodule
71
+ dataset:
72
+ _target_: audio_data_pytorch.WAVDataset
73
+ path: ./data/triton_aug
74
+ recursive: true
75
+ sample_rate: ${sampling_rate}
76
+ transforms:
77
+ _target_: audio_data_pytorch.AllTransform
78
+ crop_size: ${length}
79
+ stereo: true
80
+ source_rate: ${sampling_rate}
81
+ target_rate: ${sampling_rate}
82
+ loudness: -20
83
+ val_split: 0.05
84
+ batch_size: ${batch_size}
85
+ num_workers: ${num_workers}
86
+ pin_memory: true
87
+ callbacks:
88
+ rich_progress_bar:
89
+ _target_: pytorch_lightning.callbacks.RichProgressBar
90
+ model_checkpoint:
91
+ _target_: pytorch_lightning.callbacks.ModelCheckpoint
92
+ monitor: valid_loss
93
+ save_top_k: 1
94
+ save_last: true
95
+ mode: min
96
+ verbose: false
97
+ dirpath: ${logs_dir}/ckpts/${now:%Y-%m-%d-%H-%M-%S}
98
+ filename: '{epoch:02d}-{valid_loss:.3f}'
99
+ model_summary:
100
+ _target_: pytorch_lightning.callbacks.RichModelSummary
101
+ max_depth: 2
102
+ audio_samples_logger:
103
+ _target_: main.module_base.SampleLogger
104
+ num_items: 4
105
+ channels: ${channels}
106
+ sampling_rate: ${sampling_rate}
107
+ length: ${length}
108
+ sampling_steps:
109
+ - 50
110
+ use_ema_model: true
111
+ loggers:
112
+ wandb:
113
+ _target_: pytorch_lightning.loggers.wandb.WandbLogger
114
+ project: ${oc.env:WANDB_PROJECT}
115
+ entity: ${oc.env:WANDB_ENTITY}
116
+ name: percussion_v0-finetuned-triton
117
+ job_type: train
118
+ group: ''
119
+ save_dir: ${logs_dir}
120
+ trainer:
121
+ _target_: pytorch_lightning.Trainer
122
+ gpus: 1
123
+ precision: 16
124
+ accelerator: gpu
125
+ min_epochs: 0
126
+ max_epochs: -1
127
+ enable_model_summary: false
128
+ log_every_n_steps: 1
129
+ check_val_every_n_epoch: null
130
+ val_check_interval: ${log_every_n_steps}
131
+ accumulate_grad_batches: ${accumulate_grad_batches}
132
+ ckpt: saved_models/percussion-finetuned-triton/percussion_v0-finetuned-triton.ckpt
percussion_v0-finetuned-triton.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72c6f82de16914317fe163bb28d84459e0f7374804037fc622512cf782367980
3
+ size 509086849