khursanirevo committed on
Commit
b373b5f
·
verified ·
1 Parent(s): 4d650bb

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. config.json +51 -0
  2. lora.safetensors +3 -0
  3. optimizer.pt +3 -0
  4. train_state.pt +3 -0
config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dim": 4096,
3
+ "text_card": 32000,
4
+ "existing_text_padding_id": 3,
5
+ "n_q": 16,
6
+ "dep_q": 8,
7
+ "card": 2048,
8
+ "num_heads": 32,
9
+ "num_layers": 32,
10
+ "hidden_scale": 4.125,
11
+ "causal": true,
12
+ "layer_scale": null,
13
+ "context": 3000,
14
+ "max_period": 10000,
15
+ "gating": "silu",
16
+ "norm": "rms_norm_f32",
17
+ "positional_embedding": "rope",
18
+ "depformer_dim": 1024,
19
+ "depformer_dim_feedforward": 4224,
20
+ "depformer_num_heads": 16,
21
+ "depformer_num_layers": 6,
22
+ "depformer_layer_scale": null,
23
+ "depformer_multi_linear": true,
24
+ "depformer_context": 8,
25
+ "depformer_max_period": 10000,
26
+ "depformer_gating": "silu",
27
+ "depformer_pos_emb": "none",
28
+ "depformer_weights_per_step": true,
29
+ "delays": [
30
+ 0,
31
+ 0,
32
+ 1,
33
+ 1,
34
+ 1,
35
+ 1,
36
+ 1,
37
+ 1,
38
+ 1,
39
+ 0,
40
+ 1,
41
+ 1,
42
+ 1,
43
+ 1,
44
+ 1,
45
+ 1,
46
+ 1
47
+ ],
48
+ "lora": true,
49
+ "lora_rank": 128,
50
+ "lora_scaling": 2.0
51
+ }
lora.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2ca82c3dcfe0ee5e6f382758daa69e9095f067c751912b1036368cc5b976323
3
+ size 775835456
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f44f32cb8f6534ebc3e693e2c86f9b108aa302e87c72d4aa4ea27fb78370833
3
+ size 3103570168
train_state.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90d8a1604c309efdd22e77092c02cf9eeef3a833ed46af234b350bb89bf86795
3
+ size 880