RoyalCities committed on
Commit
c72b261
·
verified ·
1 Parent(s): 145ccab

Upload 3 files

Browse files
Audialab_EDM_Elements.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:740c58fcf84a887d536ff39b3bf3e87318618fe79ed90483d31e3e85a6a18724
3
+ size 4854117139
Audialab_EDM_Elements_Small.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dffb8cfbed51ab90046987994f63b012f06844efa69d94583b3f639bcfa42443
3
+ size 2427159451
model_config.json ADDED
@@ -0,0 +1,128 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "diffusion_cond",
3
+ "sample_size": 882000,
4
+ "sample_rate": 44100,
5
+ "audio_channels": 2,
6
+ "model": {
7
+ "pretransform": {
8
+ "type": "autoencoder",
9
+ "iterate_batch": true,
10
+ "config": {
11
+ "encoder": {
12
+ "type": "oobleck",
13
+ "requires_grad": false,
14
+ "config": {
15
+ "in_channels": 2,
16
+ "channels": 128,
17
+ "c_mults": [1, 2, 4, 8, 16],
18
+ "strides": [2, 4, 4, 8, 8],
19
+ "latent_dim": 128,
20
+ "use_snake": true
21
+ }
22
+ },
23
+ "decoder": {
24
+ "type": "oobleck",
25
+ "config": {
26
+ "out_channels": 2,
27
+ "channels": 128,
28
+ "c_mults": [1, 2, 4, 8, 16],
29
+ "strides": [2, 4, 4, 8, 8],
30
+ "latent_dim": 64,
31
+ "use_snake": true,
32
+ "final_tanh": false
33
+ }
34
+ },
35
+ "bottleneck": {
36
+ "type": "vae"
37
+ },
38
+ "latent_dim": 64,
39
+ "downsampling_ratio": 2048,
40
+ "io_channels": 2
41
+ }
42
+ },
43
+ "conditioning": {
44
+ "configs": [
45
+ {
46
+ "id": "prompt",
47
+ "type": "t5",
48
+ "config": {
49
+ "t5_model_name": "t5-base",
50
+ "max_length": 128
51
+ }
52
+ },
53
+ {
54
+ "id": "seconds_start",
55
+ "type": "number",
56
+ "config": {
57
+ "min_val": 0,
58
+ "max_val": 512
59
+ }
60
+ },
61
+ {
62
+ "id": "seconds_total",
63
+ "type": "number",
64
+ "config": {
65
+ "min_val": 0,
66
+ "max_val": 512
67
+ }
68
+ }
69
+ ],
70
+ "cond_dim": 768
71
+ },
72
+ "diffusion": {
73
+ "cross_attention_cond_ids": ["prompt", "seconds_start", "seconds_total"],
74
+ "global_cond_ids": ["seconds_start", "seconds_total"],
75
+ "type": "dit",
76
+ "config": {
77
+ "io_channels": 64,
78
+ "embed_dim": 1536,
79
+ "depth": 24,
80
+ "num_heads": 24,
81
+ "cond_token_dim": 768,
82
+ "global_cond_dim": 1536,
83
+ "project_cond_tokens": false,
84
+ "transformer_type": "continuous_transformer"
85
+ }
86
+ },
87
+ "io_channels": 64
88
+ },
89
+ "training": {
90
+ "pre_encoded": true,
91
+ "use_ema": true,
92
+ "log_loss_info": false,
93
+ "optimizer_configs": {
94
+ "diffusion": {
95
+ "optimizer": {
96
+ "type": "AdamW",
97
+ "config": {
98
+ "lr": 5e-5,
99
+ "betas": [0.9, 0.999],
100
+ "weight_decay": 1e-3
101
+ }
102
+ },
103
+ "scheduler": {
104
+ "type": "InverseLR",
105
+ "config": {
106
+ "inv_gamma": 1000000,
107
+ "power": 0.5,
108
+ "warmup": 0.99
109
+ }
110
+ }
111
+ }
112
+ },
113
+ "demo": {
114
+ "demo_every": 4742,
115
+ "demo_steps": 250,
116
+ "num_demos": 6,
117
+ "demo_cond": [
118
+ {"prompt": "Lead, Square, Clean, Warm, MF, HF, fast speed, alternating arp melody, F# minor, 110BPM, 8 bars", "seconds_start": 0, "seconds_total": 17},
119
+ {"prompt": "Lead, Saw, Synth, Warm, Supersaw, MF, HF, medium speed, bounce, catchy, melody, E minor, 128BPM, 8 bars", "seconds_start": 0, "seconds_total": 15},
120
+ {"prompt": "Bass, Punchy, Pluck, Clean, Sub, Sine, LF, catchy top simple melody F# minor, 140BPM, 8 bars", "seconds_start": 0, "seconds_total": 13},
121
+ {"prompt": "Lead, Square, Synth, Buzzy, Legato, MF, HF, top catchy melody, F# minor, 150BPM, 8 bars, with medium reverb", "seconds_start": 0, "seconds_total": 7},
122
+ {"prompt": "Pluck, Sine, bright, clean, Bell, HF, fast chord progression, with rising arp melody, C minor, 120BPM, 4 bars, with quarter-beat gate, with rising low-pass", "seconds_start": 0, "seconds_total": 8},
123
+ {"prompt": "Pluck, Sine, bright, clean, Bell, HF, fast chord progression, with rising arp melody, C minor, 120BPM, 4 bars, with quarter-beat gate, with rising low-pass", "seconds_start": 0, "seconds_total": 8}
124
+ ],
125
+ "demo_cfg_scales": [4, 7]
126
+ }
127
+ }
128
+ }