AbstractPhil committed on
Commit
d5ffbb5
·
verified ·
1 Parent(s): 7b168c5

Config update at step 1250

Browse files
Files changed (1) hide show
  1. config.json +77 -0
config.json ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modality_dims": {
3
+ "clip_l": 768,
4
+ "clip_g": 1280,
5
+ "t5_xl_l": 2048,
6
+ "t5_xl_g": 2048
7
+ },
8
+ "modality_seq_lens": {
9
+ "clip_l": 77,
10
+ "clip_g": 77,
11
+ "t5_xl_l": 512,
12
+ "t5_xl_g": 512
13
+ },
14
+ "binding_config": {
15
+ "clip_l": {
16
+ "t5_xl_l": 0.3
17
+ },
18
+ "clip_g": {
19
+ "t5_xl_g": 0.3
20
+ },
21
+ "t5_xl_l": {},
22
+ "t5_xl_g": {}
23
+ },
24
+ "latent_dim": 2048,
25
+ "seq_len": 77,
26
+ "encoder_layers": 3,
27
+ "decoder_layers": 3,
28
+ "hidden_dim": 1024,
29
+ "dropout": 0.1,
30
+ "fusion_strategy": "adaptive_cantor",
31
+ "fusion_heads": 8,
32
+ "fusion_dropout": 0.1,
33
+ "cantor_depth": 8,
34
+ "cantor_local_window": 3,
35
+ "alpha_init": 1.0,
36
+ "beta_init": 0.3,
37
+ "alpha_lr_scale": 0.1,
38
+ "beta_lr_scale": 1.0,
39
+ "beta_kl": 0.1,
40
+ "beta_reconstruction": 1.0,
41
+ "beta_cross_modal": 0.05,
42
+ "beta_alpha_regularization": 0.01,
43
+ "recon_type": "mse",
44
+ "modality_recon_weights": {
45
+ "clip_l": 1.0,
46
+ "clip_g": 1.0,
47
+ "t5_xl_l": 0.3,
48
+ "t5_xl_g": 0.3
49
+ },
50
+ "use_kl_annealing": true,
51
+ "kl_anneal_epochs": 10,
52
+ "kl_start_beta": 0.0,
53
+ "batch_size": 8,
54
+ "num_epochs": 100,
55
+ "learning_rate": 0.0001,
56
+ "weight_decay": 1e-05,
57
+ "gradient_clip": 1.0,
58
+ "use_scheduler": true,
59
+ "scheduler_type": "cosine",
60
+ "num_samples": 10000,
61
+ "synthetic_ratio": 0.15,
62
+ "checkpoint_dir": "./checkpoints_lyra_adaptive_cantor",
63
+ "save_every": 1000,
64
+ "keep_last_n": 3,
65
+ "hf_repo": "AbstractPhil/vae-lyra-xl-adaptive-cantor",
66
+ "push_to_hub": true,
67
+ "push_every": 2000,
68
+ "auto_load_from_hub": true,
69
+ "use_wandb": false,
70
+ "wandb_project": "vae-lyra-adaptive-cantor",
71
+ "wandb_entity": null,
72
+ "log_every": 50,
73
+ "device": "cuda",
74
+ "mixed_precision": true,
75
+ "seed": 42,
76
+ "num_workers": 0
77
+ }