-
Notifications
You must be signed in to change notification settings - Fork 1
/
best_model.json
105 lines (105 loc) · 3.38 KB
/
best_model.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
{
"model_type": "diffusion_cond",
"sample_size": 1048576,
"sample_rate": 44100,
"audio_channels": 1,
"model": {
"pretransform": {
"type": "autoencoder",
"iterate_batch": true,
"config": {
"encoder": {
"type": "dac",
"config": {
"in_channels": 1,
"latent_dim": 128,
"d_model": 128,
"strides": [4, 4, 8, 8]
}
},
"decoder": {
"type": "dac",
"config": {
"out_channels": 1,
"latent_dim": 64,
"channels": 1536,
"rates": [8, 8, 4, 4]
}
},
"bottleneck": {
"type": "vae"
},
"latent_dim": 64,
"downsampling_ratio": 1024,
"io_channels": 1
}
},
"conditioning": {
"configs": [
{
"id": "prompt",
"type": "clap_text",
"config": {
"audio_model_type": "HTSAT-base",
"enable_fusion": true,
"clap_ckpt_path": "./ckpts/clap/clap.ckpt",
"use_text_features": true,
"feature_layer_ix": -2
}
},
{
"id": "seconds_start",
"type": "int",
"config": {
"min_val": 0,
"max_val": 512
}
},
{
"id": "seconds_total",
"type": "int",
"config": {
"min_val": 0,
"max_val": 512
}
}
],
"cond_dim": 768
},
"diffusion": {
"type": "adp_cfg_1d",
"cross_attention_cond_ids": ["prompt", "seconds_start", "seconds_total"],
"config": {
"in_channels": 64,
"context_embedding_features": 768,
"context_embedding_max_length": 79,
"channels": 256,
"resnet_groups": 16,
"kernel_multiplier_downsample": 2,
"multipliers": [4, 4, 4, 5, 5],
"factors": [1, 2, 2, 4],
"num_blocks": [2, 2, 2, 2],
"attentions": [1, 3, 3, 3, 3],
"attention_heads": 16,
"attention_multiplier": 4,
"use_nearest_upsample": false,
"use_skip_scale": true,
"use_context_time": true
}
},
"io_channels": 64
},
"training": {
"learning_rate": 4e-5,
"demo": {
"demo_every": 2000,
"demo_steps": 250,
"num_demos": 2,
"demo_cond": [
{"prompt": "guitar, drums, bass, rock, 140 BPM", "seconds_start": 0, "seconds_total": 20},
{"prompt": "piano, classical, 161 BPM", "seconds_start": 10, "seconds_total": 25}
],
"demo_cfg_scales": [3, 6]
}
}
}