crlandsc
/

tiny-audio-diffusion-hihats

waveform diffusion

audio diffusion

Model card Files Files and versions Community

crlandsc commited on Jun 15, 2023

Commit

d327db5

•

1 Parent(s): 222db38

added hihat ckpt and config

Files changed (2) hide show

config.yaml +131 -0
hihats_v2.ckpt +3 -0

config.yaml ADDED Viewed

	@@ -0,0 +1,131 @@

+seed: 12345
+train: true
+ignore_warnings: true
+print_config: false
+work_dir: ${hydra:runtime.cwd}
+logs_dir: ${work_dir}${oc.env:DIR_LOGS}
+data_dir: ${work_dir}${oc.env:DIR_DATA}
+ckpt_dir: ${logs_dir}/ckpts/${now:%Y-%m-%d-%H-%M-%S}
+module: main.module_base
+batch_size: 1
+accumulate_grad_batches: 32
+num_workers: 8
+sampling_rate: 44100
+length: 32768
+channels: 2
+log_every_n_steps: 1000
+model:
+  _target_: ${module}.Model
+  lr: 0.0001
+  lr_beta1: 0.95
+  lr_beta2: 0.999
+  lr_eps: 1.0e-06
+  lr_weight_decay: 0.001
+  ema_beta: 0.995
+  ema_power: 0.7
+  model:
+    _target_: main.DiffusionModel
+    net_t:
+      _target_: ${module}.UNetT
+    in_channels: 2
+    channels:
+    - 32
+    - 32
+    - 64
+    - 64
+    - 128
+    - 128
+    - 256
+    - 256
+    factors:
+    - 1
+    - 2
+    - 2
+    - 2
+    - 2
+    - 2
+    - 2
+    - 2
+    items:
+    - 2
+    - 2
+    - 2
+    - 2
+    - 2
+    - 2
+    - 4
+    - 4
+    attentions:
+    - 0
+    - 0
+    - 0
+    - 0
+    - 0
+    - 1
+    - 1
+    - 1
+    attention_heads: 8
+    attention_features: 64
+datamodule:
+  _target_: main.module_base.Datamodule
+  dataset:
+    _target_: audio_data_pytorch.WAVDataset
+    path: ./data/wav_dataset/kicks
+    recursive: true
+    sample_rate: ${sampling_rate}
+    transforms:
+      _target_: audio_data_pytorch.AllTransform
+      crop_size: ${length}
+      stereo: true
+      source_rate: ${sampling_rate}
+      target_rate: ${sampling_rate}
+      loudness: -20
+  val_split: 0.05
+  batch_size: ${batch_size}
+  num_workers: ${num_workers}
+  pin_memory: true
+callbacks:
+  rich_progress_bar:
+    _target_: pytorch_lightning.callbacks.RichProgressBar
+  model_checkpoint:
+    _target_: pytorch_lightning.callbacks.ModelCheckpoint
+    monitor: valid_loss
+    save_top_k: 1
+    save_last: true
+    mode: min
+    verbose: false
+    dirpath: ${logs_dir}/ckpts/${now:%Y-%m-%d-%H-%M-%S}
+    filename: '{epoch:02d}-{valid_loss:.3f}'
+  model_summary:
+    _target_: pytorch_lightning.callbacks.RichModelSummary
+    max_depth: 2
+  audio_samples_logger:
+    _target_: main.module_base.SampleLogger
+    num_items: 4
+    channels: ${channels}
+    sampling_rate: ${sampling_rate}
+    length: ${length}
+    sampling_steps:
+    - 50
+    use_ema_model: true
+loggers:
+  wandb:
+    _target_: pytorch_lightning.loggers.wandb.WandbLogger
+    project: ${oc.env:WANDB_PROJECT}
+    entity: ${oc.env:WANDB_ENTITY}
+    name: kicks_v7
+    job_type: train
+    group: ''
+    save_dir: ${logs_dir}
+trainer:
+  _target_: pytorch_lightning.Trainer
+  gpus: 1
+  precision: 16
+  accelerator: gpu
+  min_epochs: 0
+  max_epochs: -1
+  enable_model_summary: false
+  log_every_n_steps: 1
+  check_val_every_n_epoch: null
+  val_check_interval: ${log_every_n_steps}
+  accumulate_grad_batches: ${accumulate_grad_batches}

hihats_v2.ckpt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc7245d3d5617bb3a76dcc8534d9cee25030c3986fa80502f19ec3506a68d05c
+size 509086593