travistest committed on
Commit
647113f
·
verified ·
1 Parent(s): f59aee0

Training in progress, step 100

Browse files
README.md CHANGED
@@ -4,10 +4,10 @@ library_name: transformers
4
  model_name: phi-3.5-mini-grpo-v3
5
  tags:
6
  - generated_from_trainer
 
 
7
  - hf_jobs
8
  - trl
9
- - grpo
10
- - unsloth
11
  licence: license
12
  ---
13
 
 
4
  model_name: phi-3.5-mini-grpo-v3
5
  tags:
6
  - generated_from_trainer
7
+ - unsloth
8
+ - grpo
9
  - hf_jobs
10
  - trl
 
 
11
  licence: license
12
  ---
13
 
adapter_config.json CHANGED
@@ -33,13 +33,13 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
- "v_proj",
37
- "down_proj",
38
  "k_proj",
39
- "o_proj",
 
40
  "gate_proj",
41
- "up_proj",
42
- "q_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "q_proj",
37
+ "up_proj",
38
  "k_proj",
39
+ "down_proj",
40
+ "v_proj",
41
  "gate_proj",
42
+ "o_proj"
 
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6610c6769aff5b08d09e52f79883f61f960dc66717a9d5de95b2a4d2bc8d3d13
3
  size 59827904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d87c83bd19d060b3d0e82ce25b2c87b9bb456c1718c20f6c84bdc8a275aad308
3
  size 59827904
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d45c721923d59890a86a891c9f4a5c3792af0a242a9175f97cf53645c645cc63
3
  size 7377
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00df46c50cf6f5b574e5463a5473be3b1833bb92d2b88bdc4870f2a74d0ab03c
3
  size 7377