File size: 740 Bytes
b47a561
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
# Model configuration: the task plus encoder and decoder settings.
model:
  task: audio
  encoder:
    name: wavlm
    version: base
    pretrained: true
    # Relative checkpoint path; presumably resolved from the project root — confirm.
    pretrained_path: manipulate_model/encoder_checkpoints/wavlm/WavLM-Base+.pt
    # NOTE(review): presumably selects which encoder layer's output is used —
    # confirm the meaning and whether the index is 0- or 1-based.
    output_layer: 3
  # Sibling of `encoder`, not nested inside it. false presumably means the
  # encoder weights are updated during training — confirm.
  encoder_freeze: false
  decoder:
    name: aasist
    version: default
    output_size: 2
  # NOTE(review): presumably the encoder runs inside the training loop rather
  # than on pre-computed features — confirm.
  online_encoding: true
# Dataset configuration: which dataset, which splits, and how samples are cut.
data:
  name: av1m

  # Split selection; every split currently uses `all` parts.
  train_parts: all
  val_parts: all
  test_parts: all

  # Per-split sample counts. NOTE(review): -1 presumably means "no limit" —
  # confirm against the data loader.
  train_size: -1
  val_size: -1
  test_size: -1

  # NOTE(review): presumably (channels, height, width) of a video frame; with
  # `model.task: audio` this may be unused — confirm.
  shape: [3, 224, 224]

  # presumably audio sample rate in Hz and video frames per second — confirm
  sr: 16000
  fps: 25

  # Windowing options. NOTE(review): the unit of window_size is not visible
  # here (seconds vs. frames) — confirm.
  center_transition: true
  window_size: 4
  sliding_window: false
# Training settings: data loading, optimisation, loss and logging.
train:
  num_workers: 16
  batch_size: 64
  num_epochs: 15
  optimizer: adam
  scheduler: step
  lr: 0.0001
  # NOTE(review): if `step` maps to a StepLR-style scheduler stepped once per
  # epoch, lr is multiplied by 0.1 every epoch, so over 15 epochs it shrinks by
  # more than ten orders of magnitude. Confirm this decay is intended.
  step_size: 1
  gamma: 0.1
  # NOTE(review): `bce` is used alongside `model.decoder.output_size: 2` —
  # confirm the loss matches the decoder's output shape.
  loss: bce
  # presumably the number of iterations between log lines — confirm the unit
  log_interval: 100
  shuffle: true
# Top-level debug switch, currently off; its effect is defined by the consuming code.
debug: false