AKM-12 committed on
Commit
5f63d12
·
verified ·
1 Parent(s): cef1ec6

Upload general knowledge GRPO v3 final model

Browse files
config.json CHANGED
@@ -48,7 +48,7 @@
48
  "num_attention_heads": 16,
49
  "num_hidden_layers": 28,
50
  "num_key_value_heads": 8,
51
- "pad_token_id": null,
52
  "rms_norm_eps": 1e-06,
53
  "rope_parameters": {
54
  "rope_theta": 1000000,
@@ -57,7 +57,7 @@
57
  "sliding_window": null,
58
  "tie_word_embeddings": true,
59
  "transformers_version": "5.7.0",
60
- "use_cache": false,
61
  "use_sliding_window": false,
62
  "vocab_size": 151936
63
  }
 
48
  "num_attention_heads": 16,
49
  "num_hidden_layers": 28,
50
  "num_key_value_heads": 8,
51
+ "pad_token_id": 151643,
52
  "rms_norm_eps": 1e-06,
53
  "rope_parameters": {
54
  "rope_theta": 1000000,
 
57
  "sliding_window": null,
58
  "tie_word_embeddings": true,
59
  "transformers_version": "5.7.0",
60
+ "use_cache": true,
61
  "use_sliding_window": false,
62
  "vocab_size": 151936
63
  }
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "temperature": 0.1,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
- "transformers_version": "5.7.0"
13
  }
 
9
  "temperature": 0.1,
10
  "top_k": 20,
11
  "top_p": 0.8,
12
+ "transformers_version": "4.51.0"
13
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96d5c91566d4105ba9dee18ed9fc9c1815b8dbae9f6c9315aec823792f9d8d64
3
  size 3441185608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:813eaad9f372af34c6dbe827ef83b2f6fa4242f384b4b4513f0aa5030b9e5e20
3
  size 3441185608
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbffd7f0e88d41e69661e1ed85706c62e4ca2d7670b594746f59d6a4b3bdbe13
3
- size 5265
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3f7e3941a0de7499e3168b07e258108060907a86cc3584f99173330ef33589d
3
+ size 7185