FOGmiaow commited on
Commit
528c26c
·
verified ·
1 Parent(s): d5b992a

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_0.pt +3 -0
  3. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_1.pt +3 -0
  4. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_10.pt +3 -0
  5. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_12.pt +3 -0
  6. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_13.pt +3 -0
  7. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_17.pt +3 -0
  8. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_18.pt +3 -0
  9. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_19.pt +3 -0
  10. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_22.pt +3 -0
  11. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_25.pt +3 -0
  12. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_26.pt +3 -0
  13. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_28.pt +3 -0
  14. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_29.pt +3 -0
  15. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_31.pt +3 -0
  16. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_4.pt +3 -0
  17. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_5.pt +3 -0
  18. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_6.pt +3 -0
  19. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_9.pt +3 -0
  20. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json +3 -0
  21. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_0.pt +3 -0
  22. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_1.pt +3 -0
  23. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_10.pt +3 -0
  24. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_11.pt +3 -0
  25. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_12.pt +3 -0
  26. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_13.pt +3 -0
  27. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_14.pt +3 -0
  28. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_16.pt +3 -0
  29. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_17.pt +3 -0
  30. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_19.pt +3 -0
  31. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_20.pt +3 -0
  32. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_21.pt +3 -0
  33. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_22.pt +3 -0
  34. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_23.pt +3 -0
  35. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_24.pt +3 -0
  36. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_25.pt +3 -0
  37. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_26.pt +3 -0
  38. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_27.pt +3 -0
  39. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_29.pt +3 -0
  40. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_30.pt +3 -0
  41. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_31.pt +3 -0
  42. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_4.pt +3 -0
  43. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_6.pt +3 -0
  44. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_8.pt +3 -0
  45. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_9.pt +3 -0
  46. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_15.pt +3 -0
  47. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_17.pt +3 -0
  48. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_20.pt +3 -0
  49. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_21.pt +3 -0
  50. mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_23.pt +3 -0
.gitattributes CHANGED
@@ -44,3 +44,4 @@ mn-coding-adam-2e6-32k-ds-r1-1.5b-adamw-lr2e-6/global_step_100/actor/huggingface
44
  coding-adam-3e6-16k-ds-r1-1.5b-adamw-lr3e-6/global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
45
  coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_300/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
46
  mn-coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_340/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
44
  coding-adam-3e6-16k-ds-r1-1.5b-adamw-lr3e-6/global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
45
  coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_300/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
46
  mn-coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_340/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
47
+ mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d1dd7ee7f01f51666f49082c72e36b83d4ab8b6e5ee6561523a9b045cec422f
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96cbcf48d321ef8fe52221933081c988c5a92cee2d8461d29a1a64a5bd4e0279
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43be47bd03d4f58376404353b0898d654473bfdbab5ff39954e66d94ad543790
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_12.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c0f20c7c02154d47c463bc4792591f6ed47c94eff2d0bddba5be9f02089535
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_13.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b02335d8af967a694c406c21c62b5844ca597f093dcb8174b0d02b43a7bc1037
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b727faf4558a86827cd6f81401d0636b5a2d27728870408887c2919ee3bf395
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_18.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:311cfd4309bed6fffa981ff90ddf4e9018f10e50e6328e43412cecf18d165ca8
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:694ff54a9b32da5b4eeea7b2d6840b4ceca0c4c7c485fc8bbaae7e2d703f9af8
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_22.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2e486c28052f9a069da1894861b79c93e879a75ebf04d6f21fb449690e81af1
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f2c49a165ddb15168263a7763eb9957694b39afd39cd0bc39f7e46b4ef16cbf
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef250194cd450872db2ff565460235d9c3f2e1d27d5c90c79e470825bc4ed75
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_28.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74404bd16986350a0f7f3e8b2ddf2103facbe1a36e72e915f9b841ea9cb9883b
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_29.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b1eb6659d6d23fd35abe4d0276c9743ca7749c3040b7e5f8f06ec05a8ee335
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43a4a02e861cee641c0266c8edb004f0ebff0310090a1ddbdf4e3a8614331914
3
+ size 15093
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5196e25f825462ee92ca35ad0a27cd195b27f020fd7dcd9bff79306e241e765f
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_5.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ebaf8c18d653946def73b07880a13eef263f3ca70e2c729656d6996b214ed72
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_6.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7afa34f2fc28ba77a40d60f944c30d17bf4ae4a3e8ccb4bb43180d42653b0efe
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_9.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40297e63148004cc9cee9ca9ebb6fd13e33f958ee9e2254d444ab919fa2fce38
3
+ size 15085
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
3
+ size 11422778
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd390784c6c811539ae79ec0acbae1b80ac7c34575ef6c57eba2c6da5aceefc
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41684619ca9bdacdaa06fc94eeb9739517003a1429ee8329e1487147702f6d4b
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:728979783e4dd28b30b09b10617c86b778a6213ac63319f26cb654756938c2ad
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_11.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:628a9b748957e74400ece53eabf45bfb94bf70b5b4b8b493de448e74f97fc46d
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_12.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6d0bf35e280d60ac10d53c35539520c4c5d01d4e6340b150a90722613d0d837
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_13.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d45ff1ee9af70cbeeab7ee2e0b0806c858bd7db2cc9aa08511dc890f3000b4
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_14.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:618b5015498b7cc155725b9e5fa8c4fdcc862ca689f47ba6e6d5413d7f3d3f41
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2adc6db6bde7dde1c6fcc83a16eae2f5f6a0f834006b9dc44eb9c657a37e2c6c
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c72724e344835341505f498c71d55dcb5458933e83e9faf59f069847692e76
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1820b1867507e31733a8a0fbd9eb565e443634b509c974ca0e0f6573600577e
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cc5b629cd4b5c8b5757deda4a43f591883aac863b8062cbf95b07249939160f
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_21.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3394166150c2885791c8a2063305a56daee9d51d207cbad3646d77308b169489
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_22.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed979e92faaf810f46c39f1fd642f20212bf76ada3b366e7781bf07502bcdb7f
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_23.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4afad8878aabd0de0d289112f6fdc3d0af8db8c0e08800bc29dc1274f82dd987
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_24.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d51d847d4b75358f67aff0b6021e599f770a4cd098787f7ccca763a48823851
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e695b99959e268ab593db8dd9372d1655e01e80d78334e48ff751b1f01aa7540
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:172cbb6d585a749542b69298a5db4a99cee2700c0d8fb4c2158225856e072c41
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_27.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddb74a7ba49aa891ee4967c20da6ca41b630930f1b3c9e1540dd0faf37691faf
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_29.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fb0a6ed8f13d32cba0041d5389714b0a7b6c863c95c383da63ea2197b158f97
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_30.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f594e9e0408c156587e82ce7f2e95b3258a95b669a3309e7ee49ec8690e15e9
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b1f0ceb8782bfb8d8314983ed226fb7fc0d7648815172f8f585ce4d8b808ec1
3
+ size 222310687
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:382abff4b803ff3302a19457f8e081a624399b24c1a6cc0d803a64cc56a080fc
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_6.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b28c06635e297d9671e01591807d1e40e730a92b87ad7fa94fea93f5dc601e52
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_8.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca9fcde5abf16c9c9127328eeffba716e7d5286294689d1ec44f9b5dc44e6d0e
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_9.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23855c8e9cf2f07cd98969c31f64e54abfe41a23e4bacfa609fb113ff1da787b
3
+ size 222310341
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_15.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89e4a318dd41369d88614c29761a31dd55d59a46032cc32a374534e9537ff851
3
+ size 444753565
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a1d305822d7a184a1e9f0a2178d6679a83d610d2eb73445dd974e9d1b8c7c9
3
+ size 444753565
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad5e3875af2ff2ce738fc7f2ee2b98889bcc15af551402c5ea58a7eaed3fb775
3
+ size 444753565
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_21.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9080c0d87748fc6f1c283a41803895e8072316c5114c40525b6078618c2f2195
3
+ size 444753565
mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_23.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f39f8b1a9a9b244861c23af96e7c4229d11d01bf487c45c6d79c396069a7dbf0
3
+ size 444753565