Chengheng committed on
Commit
cba4934
·
verified ·
1 Parent(s): c9005bf

Upload manifest.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. manifest.json +31 -0
manifest.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "config": {
3
+ "project": "coconut-qwen3",
4
+ "name": "vq-on-latents-qwen3-0.6b-K4096-d64",
5
+ "save_dir": "/dlabscratch/dlabscratch1/Chengheng/mnlp/vq_on_latents/qwen3_0_6b/K_4096_d_64",
6
+ "latents_path": "/dlabscratch/dlabscratch1/Chengheng/mnlp/vq_on_latents/latent_embeddings_qwen3_0_6b_fp32/latents_train.npz",
7
+ "wandb": true,
8
+ "use_fsq": false,
9
+ "vq_latent_dim": 64,
10
+ "vq_num_embeddings": 4096,
11
+ "vq_commitment_cost": 1.0,
12
+ "vq_decay": 0.999,
13
+ "vq_threshold_ema_dead_code": 0,
14
+ "vq_use_cosine_sim": false,
15
+ "vq_orthogonal_reg_weight": 0,
16
+ "vq_orthogonal_reg_max_codes": 128,
17
+ "vq_sample_codebook_temp": 0.0,
18
+ "vq_lib_kmeans_init": false,
19
+ "kmeans_init_from_dataset": true,
20
+ "warmup_steps": 1000,
21
+ "per_position": false,
22
+ "commitment_weight": 0.1,
23
+ "batch_size": 256,
24
+ "num_epochs": 10,
25
+ "lr": 0.0005,
26
+ "weight_decay": 0.01,
27
+ "seed": 0,
28
+ "log_every": 50
29
+ },
30
+ "per_position": false
31
+ }