Training in progress, step 100

Files changed (4) hide show

README.md CHANGED Viewed

@@ -4,10 +4,10 @@ library_name: transformers
 model_name: phi-3.5-mini-grpo-v3
 tags:
 - generated_from_trainer
 - hf_jobs
 - trl
-- grpo
-- unsloth
 licence: license
 ---

 model_name: phi-3.5-mini-grpo-v3
 tags:
 - generated_from_trainer
+- unsloth
+- grpo
 - hf_jobs
 - trl
 licence: license
 ---

adapter_config.json CHANGED Viewed

@@ -33,13 +33,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "down_proj",
     "k_proj",
-    "o_proj",
     "gate_proj",
-    "up_proj",
-    "q_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
+    "up_proj",
     "k_proj",
+    "down_proj",
+    "v_proj",
     "gate_proj",
+    "o_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6610c6769aff5b08d09e52f79883f61f960dc66717a9d5de95b2a4d2bc8d3d13
 size 59827904

 version https://git-lfs.github.com/spec/v1
+oid sha256:d87c83bd19d060b3d0e82ce25b2c87b9bb456c1718c20f6c84bdc8a275aad308
 size 59827904

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d45c721923d59890a86a891c9f4a5c3792af0a242a9175f97cf53645c645cc63
 size 7377

 version https://git-lfs.github.com/spec/v1
+oid sha256:00df46c50cf6f5b574e5463a5473be3b1833bb92d2b88bdc4870f2a74d0ab03c
 size 7377