FOGmiaow commited on
Commit
3be7ae9
·
verified ·
1 Parent(s): bf9350c

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_11.pt +3 -0
  2. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_17.pt +3 -0
  3. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_19.pt +3 -0
  4. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_25.pt +3 -0
  5. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_27.pt +3 -0
  6. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_28.pt +3 -0
  7. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_31.pt +3 -0
  8. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_4.pt +3 -0
  9. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_5.pt +3 -0
  10. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_9.pt +3 -0
  11. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_0.pt +3 -0
  12. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_1.pt +3 -0
  13. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_10.pt +3 -0
  14. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_11.pt +3 -0
  15. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_12.pt +3 -0
  16. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_14.pt +3 -0
  17. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_15.pt +3 -0
  18. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_17.pt +3 -0
  19. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_18.pt +3 -0
  20. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_19.pt +3 -0
  21. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_20.pt +3 -0
  22. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_21.pt +3 -0
  23. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_22.pt +3 -0
  24. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_23.pt +3 -0
  25. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_24.pt +3 -0
  26. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_25.pt +3 -0
  27. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_26.pt +3 -0
  28. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_27.pt +3 -0
  29. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_28.pt +3 -0
  30. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_29.pt +3 -0
  31. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_3.pt +3 -0
  32. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_31.pt +3 -0
  33. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_4.pt +3 -0
  34. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_5.pt +3 -0
  35. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_6.pt +3 -0
  36. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_7.pt +3 -0
  37. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_8.pt +3 -0
  38. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_1.pt +3 -0
  39. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_12.pt +3 -0
  40. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_13.pt +3 -0
  41. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_19.pt +3 -0
  42. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_2.pt +3 -0
  43. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_20.pt +3 -0
  44. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_22.pt +3 -0
  45. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_23.pt +3 -0
  46. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_24.pt +3 -0
  47. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_26.pt +3 -0
  48. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_3.pt +3 -0
  49. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_30.pt +3 -0
  50. mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_4.pt +3 -0
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_11.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6722b0b18d781e4c2e65707a66411b1c85fa4535efd43a4092c8aee1ee53234
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fb5fcc0e0d6dd2ae3a6eac0ccfa7c847d30aa8ebdddac8b365bef0f8219f8eb
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9b6769a255400a3a91a932f5124fb12060760c1a1263c17c4af30776cf59d65
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9608f14e9d75816cd6a586012fe78fd70439df80260e43307eaafccce4ad47c7
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_27.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95aab38bb235d2cb315f1612002ced4a0b53ece84565c026631df72a1810e3ed
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_28.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d286ece46eda9f2cad57de2b3d8578e319825d9258de53317e42cbbb15cb1466
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b749b265d58426b36ae07ac5ed425d8072e3f64edf60cf36455f95fa47d15b0a
3
+ size 15157
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bcba39b44b99653fc59d4159981d669ecd4cee81d7bc2d5c93e85303cb6ee16
3
+ size 15149
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_5.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9047e52c1b60059aa8a26fbb21e9b46587bd725dcd7900e2b09b8684b4c406aa
3
+ size 15149
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_9.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c369987c41b249d562d23667db025dac946c0cb0dbcd46201ecb91fee2c702c
3
+ size 15149
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:033b838883c8ee1e753b6d7110b36d232c3c4b97542276fe97422c3e8000e157
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beaf849e3fe0040a208de82b04cb6d94059821d6e5385e7ffee05db0a0b38528
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ae3f8322859abf44e11a1c755d39ab87a33399a76575b814ad751d498bd1400
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_11.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea9ab323cde9876b0042e0dcde0e3bd3a8391ab26c42c3538016a7b183b38e07
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_12.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64f48693870b007ad8a5d6bc424bf496b58687b1a54a06b07778ef645dfb283e
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_14.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5524374310d00e8658d9ab422392a0935a776c5546d74ff2fcf2f9c0dec7d371
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_15.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53dc83681229a9773fd2772dc96b0dba16a2405f5f900425b4cd49647cd79538
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58ede4ef75ae7d79dc038dc116905ac784f673ae01aaabd807830aaec82d3ff5
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_18.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5591192d0c4064d21ef24d878c9cb0642770c0d4cf9558f2f6a7962c9d00ae7f
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6409262bbfc06b775024282c1c3d283e9f8ea287f999df622191d9ccc5a7973
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612888e31ab547c6a68e518b75abde0656a3acbd4af645b1b435e83554eb9fa6
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_21.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79fb4134281118a57107524c86cfdf44dacea223d8f95003a60a5b78e9001db0
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_22.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3d0275a9a5c15b50e6da19dd8785a0ebc7eb7bb7318d88e1a9bac2a7d177c38
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_23.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc72f8d1a866fe89b15625ec113524e69ce171b9ae39d3db927c53375d19494f
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_24.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a2e2069529cd61c41c42d19c4c2be8dcba517e263f7f6bfb1cd382d2f082681
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:485b17b52bff02dfdd9910af08356e8f2bbdb501bc7b74f683694ee4a9151809
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99c81b6c12d47c1f62c0dbc076f204ccd29a8f42ff6c8422a33fff673e3521d6
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_27.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:925551a45c218f6316b0f779d67f79ae217fde3f9df31b6ad38d17a6fb72b525
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_28.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d18b99509281f33fc7a07860ffa6bbff091deabbf43b64001cd1ede0370b0ae6
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_29.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc394c0be8fd4efc09289b4985f88077e886d5b4136cd44c8fa09661e0c23fe
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_3.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92462d93652215678e2ac8e6b6a68fb28566dc722563e8331704a10eabc15eb0
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42a90bdd0779ede2b10a322abd83e073de25a3cc4046d3b8610c20299e771686
3
+ size 222310687
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f051cbe10a18972fa251a158365dd573ef1269cbac5faced8d4375414f09b23
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_5.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ba5c71643d6f1617a16a424010c835025919772c5ef863dab28e914dc7c18e1
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_6.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0977bf494c648de1132dfca70bd9a7582d3277e3064c98c9197b518d6205cb7
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_7.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c43c48aec244b4b27f7a0cb54988effb74a65500ec38ec6d8ee242b727213ea
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_8.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2be11efd6fe71420ecf19968d1f076aef7f28c0b97d98c7ff00fba193977b3f2
3
+ size 222310341
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:431cb8db6525a495f878bbb56f338366c302425eb3076847bd95ae0f8f7009e0
3
+ size 280698884
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_12.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b162f6f93bd2b8673b4c94bbc10aa63ae8f75f32d48f1403444b24e61b17fca
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_13.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03195bee439e9e487c6a385dd47eed4144b239c3d39c32171f2e892cb8076bd6
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc2715606fbbd031ee291a9e37ed035142c253d2bef32d24ebc3de82e21e8665
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_2.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eea50f4d241841add93b49431064c19c43de21f0d4712b5705bbd384ea92c54
3
+ size 280698884
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd5f6921fee858a26266abcb8d7235a8b98dfac085716caddf75ee99601c3036
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_22.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8780089422496e4a438c17a76338f755dc42abc64e8d64d773291a8313dc7128
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_23.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17aa1414d92ae012e4f16aa0018c1494bd847301f60513a2d044daeb782cc911
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_24.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817c95c63330d57b04931da0f00ba23273042f316b0f05a5580a3324e72089d5
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa28649383a25709d860ca5a54b164398ffd081d386b8a1526ce9e0998d1955
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_3.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73fcf405a2be56a091f16fcc49d3d2c5a98d161c7e8431f3fd7ff001e5f302c4
3
+ size 280698884
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_30.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80d4ce92b6fee3cc5a24d725bc32ae3b37b84545b907f57e04a464825a33ff2a
3
+ size 280699373
mn-coding-muon-1e4-32k-ds-r1-1.5b-muon-muonlr1e-4-spectral_norm-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79fc58d32fadfc3d9c3b7a950d77cf3fb96e17a8a6fdbe8f868b4f34b86c40fe
3
+ size 280698884