Skip to content

Commit

Permalink
add configs for train private data
Browse files Browse the repository at this point in the history
  • Loading branch information
hungdinhxuan committed Dec 21, 2024
1 parent c7b511d commit 487600d
Show file tree
Hide file tree
Showing 7 changed files with 690 additions and 413 deletions.
1 change: 1 addition & 0 deletions configs/data/normal_largecorpus_multiview_cnsl.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,7 @@ args:
augmentation_methods:
["RawBoost12", "pitch_1", "volume_10", "speed_01", "none"] # "none" is the original data
wav_samp_rate: 16000
trim_length: 64000
online_aug: true
aug_dir: ${oc.env:LARGE_CORPUS_FOR_CNSL}/aug
noise_path: ${oc.env:NOISE_PATH}
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,48 @@
# @package _global_

# to execute this experiment run:
# python train.py experiment=example

defaults:
- override /data: normal_largecorpus_multiview_cnsl
- override /model: xlsr_conformertcm_baseline_multiview
- override /callbacks: default_loss
- override /trainer: default

# all parameters below will be merged with parameters from default configurations set above
# this allows you to overwrite only specified parameters

tags: ["normal_largecorpus_multiview_cnsl", "xlsr_conformertcm_baseline_multiview"]

seed: 1234

trainer:
max_epochs: 100
gradient_clip_val: 0.0
accelerator: cuda

model:
optimizer:
lr: 0.000001
weight_decay: 0.0001
net: null
scheduler: null
compile: true
cross_entropy_weight: [0.7, 0.3] # Balanced weights for cross entropy loss

data:
batch_size: 14
num_workers: 8
pin_memory: true
args:
augmentation_methods: ["RawBoost12", 'RawBoost12', 'RawBoostFull', "pitch_1", "volume_10", "speed_01", "none"] # "none" is the original data
padding_type: repeat
random_start: True


logger:
wandb:
tags: ${tags}
group: "normal_largecorpus_multiview_cnsl"
aim:
experiment: "normal_largecorpus_multiview_cnsl"
Loading

0 comments on commit 487600d

Please sign in to comment.