diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_10.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..273d6481c6bbea3b05748d2ca49df1b6fd70091a --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32075475b3e269c3725f13bf7fc26b9cca2cdf926ed808f537b987a7c17af9c6 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_11.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..df7f3ddf43f105aca3cc1c5d8789cc93e5898562 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca756791b1a10b8a31f39c4e9a4dd15f1c7c04b8a6504c70bbcb365c349b5d7e +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_12.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a2b0ed5faf1faf6c247eaaf9f962ef81c91df6b --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12708cd485c1b6e3119ff3f6b25e97de1d9d93dbc0d200fbb9981c550d675875 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_13.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8d02468021cf7884f8651e9b91cbd2c20883f43 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616be0bb3ac30d6f5c3d9bd9b36faf0b0952304442688e400d5d383b7ca92fd8 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_15.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..64f0b24b917a3207dac947a6ba33dea1686b0c38 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330ecb4ababec3b487ab9dd33806aec35a826f7e2ff8b8ba36c3ee9dfe8c0aa5 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_16.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdbb06fcee1903f196e270d4761d4b43787d5e5d --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e87f10487043e6c61e775a2e3a9efbc55d2cfa7c5e81203c24f2528880c50d9c +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_17.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9de37613c63cbf07cbd316c48aed940f8dd19ef --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad117c0c1fc878753b63ce27d3fb2efffd4fb53de63f767e2f8099009bcaba6 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_19.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d34b998de8c8faab7a4e0d2a99b4a8136f4e250 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ae5696353c790e37080fc2197e7f602794a6e386280cf8a0cef2ff76fce7fa +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_20.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..c801802f9b26afa757b7bb38123664ad13974cc9 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a963a46d709ccf5a5dfe29e6ab94e5192b55d2cd3ee6bebb4a97360b017681 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_21.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea58815442602f2464d9636efff15a21f1f278a7 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a57e9ec7278894e90489fd03f4348acf9cef9aaf1229085d0c7caba3c0ef0e +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_23.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ad03996e8225f0e94571dfd48694076ac67da1 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7117b616c64eb8ca101cb49a0d81748bd9c7b2f8235f63e109c94d2664c5e0 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_25.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f5ae45da13899a817b5173a7f694a46223af87 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f957b22081de15a266db99c7d1dfac997ab2c7ec06cedbce088bdc00c00899eb +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_26.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e1307e1911b7d51cfaf22315cbdefa4c4777d5 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144b1deb40b8a9316cad8b3ea36287e28fadde756dde6280068fe05bb16ef85c +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_28.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e034b163e7dcafa5272a9c53d865e50981e3c13 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6796b161da22fe787ff66a07783f1b654e5b3880ddca7f055234e5e5f53c597 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_29.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b85ff7b33de592b436d74c6c5a7e0e7a06be3a4 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae93657511407ecfb5f6709ab4ca19f67ea20db3457f47ae2ac70d70cdf43f7e +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_31.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..880447a70a87692f5aae01c81b0a7d8be87b207a --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cabfc971a97db1b2eebc7585958cd15fcce2de9e9046fbbff01d4043b761c0b4 +size 15157 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_4.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed0ed6b2fc8b02ca1ce4f67c43fb6294dac792d --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0405d0ff4c4186fb76ab6ded919164ed52df3ed5db21610fcddf4fb55771e7c0 +size 15149 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_6.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..9113f4314afc79e916845965d5f445458b0c297a --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ffa5095cc5b871d79f259cd31f3ac99f9c518fccd1d7a750645d79ca0c1f55 +size 15149 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_7.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60705134d17ff0d407773b38018eb9c95248ce0 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c781ec2129b6395aec2e2b0cc94c8f4526fa2d86bdf9313eb2558b55458ab8e6 +size 15149 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_8.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a1228e1406d97c0d4cf0ee8093eb7bcb924a6d6 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a7bf5d3066e27ae1da68a985150bb0041211d2526fe9ee1cbb8c367aca33f0 +size 15149 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_9.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa93b3a755d478326752050a1cbc246f5bf7536 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/extra_state_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c976faca5d4aeba945054a674d8b744ac4e8d507fe2ac575b884f81f1bf141 +size 15149 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_10.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa33a022c23be4274fc48cd3d702e01b8b1b986 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583f1fe8f6d5a499dcd72921b4a64ca73e7ae95157bd13d4f4082aacbdbba044 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_11.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9567cb8e8f93e6d2b6cb313a6bd55d7fc3724d1 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b9558504774c75f6be2cfc7d130b48da6999854a5a942ef1cada2dd1f1f722 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_12.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..127c4bff54432b2279ecefce6d5049a4cdba892f --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78776e24e8c9eade04b77fff5a04d4dc3aae44800cfd82e108867ea289f9883b +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_13.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56d7d60d39c6ac4ab9986f74c508515775c94a6 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e541038c9347982b6ca06433d668eeb31d68ed7e7e2aa0273a583a319ecac2c +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_14.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_14.pt new file mode 100644 index 0000000000000000000000000000000000000000..91432d8d2bd332da7fb9a612798945b398fc118a --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_14.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0efb7792f7d71e5b016f458ffd04dc4b6f1551bfe720a2b76319a9696e542029 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_15.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a302b86c8f06cc828e3f7bcbc9d578f0daa26f6 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db9f631cd140e8af30eedb14a53b61595d533cfdd253ec1a8010b287f38b675 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_16.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..93838f92bc92f2f23e81492078b09e1f6a2b7a49 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105800b7b88bcde4672c6dbd4dac41f672ad195254c60ee136542ef2f938f517 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_17.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e989ed1458f39db4c914e1bbf423dc46a29c10 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778f21c46efeb5b14ceba3371ef2c72fe9f60727af2576111d04b6d24f9fef9c +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_18.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd0be23dd57b1659032f4dcc556dc9ed44d09434 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3146059f709b4184ac1b46121f72db82e10740cc45acebbd871e5bd16d1253 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_19.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c13126087a0027aae86191a0ec419c21494d0a3 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc7f04c7b826a7c3e5731d98ea83c51dd60e7e1e118587a627d87942959eb70 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_2.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_2.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca2cd1e869d2005724d11a0799e4555b07fdc9e --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d07cce8cec4c3bd4f4806e3df01e31b92b924bf5cbe9bdf3896f4198bf677718 +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_20.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ea70d9cc3b1dd347530d0a118aa861f28351d1 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e2e763120a4fa5d7d87de9e45b42cddaf5e348f82ad55413ac5b681c0a1ffd0 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_21.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e119d306fbe89217f102d0cca118ff318f4344 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5e31c28db29f37cab5e90617df743427c3c1dc4e4e336cebe4545806dc0b7d +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_22.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_22.pt new file mode 100644 index 0000000000000000000000000000000000000000..74db36189834e2bba306fd4645359a5011d29b0e --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_22.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96dac4928922dfd560183e2f531b616b90225315ffceebbfce9b18e515dd890d +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_23.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..1144e1a72bc04b68abd8ba2d20722c66ea1d662e --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc366a7d5b815d0153866d6a62ed276939b8c63d3230fcccf48dde5dddc4c0d0 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_24.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..635c768d3780f3a3c6a8ac12261fc1b5a230d5aa --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f484ec1c3cdb1d6cfef5a6d492081308e032f66bd82d006f0be9c2fdbea142be +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_25.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..80215977b0a814e5d4fb9e19d43d6aa1960d3972 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c23259bb7fc817b9bd743401add0796a6abbf2725b4430b37c1051ad5f5567b +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_27.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..12da01ec762aea9d7a1ef7b9685217a8ae7a68d9 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35109509090a60e845512ab02fdfe1db336265b2b5b0e590c309067757bb4055 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_28.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..99dfd1f912b83e2ef32813a15c14186c3fc57984 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c7889e8f83df2d2d2b826f2c4d0d497567b2c314bd8548970c13fae709a452 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_29.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..06a12bbbd3708423031b817a7b0200a11255cfbc --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b26f45d6202706442a77878b21f93bab256df2819f3ba49f9395b921665e5e +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_3.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..a91c900a62b85a75b0f6cef0c237665d916e0ed7 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9cd107879362e73565fe81fbd8e3166f0a6fd437163f1876294ae1c2d6e0c0 +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_30.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_30.pt new file mode 100644 index 0000000000000000000000000000000000000000..464d1173bd16bba26fcca48d2edd6cbf6d53d780 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_30.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9567b5b8bc052c5bd8c1c3c2f8e0ffbdfa810ef411958ace10200ea40c6bf563 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_31.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0c037e398fa640cf000d0b3a4aae8337db9387 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868a75aefdcbfc47672971e8fa6e5b08d107af4c342a3ea6afa6d739f1ac0548 +size 222310687 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_5.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f10394d2cf832e0dadfda5aeac2928aa35b02bd --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a777e664626c3e1f210706c1f0da702db54e385ed9700afe454711329fd9d98 +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_6.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb983561831f34625f9f7c8b6123654caa57fc5 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ed3e20fdae3da59e40187e22e501214d496b4b89d31ed5e36788b3b5913e0b +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_7.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..5749decdc702dc5ed653cb45169d82ff7f417744 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c7b46c655058e1f1a6f248b398a82d3a7511b39231da1980fa00602e34034f +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_8.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..221add21836d277849376b395d57f47eebef3814 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/model_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7296d6d18b13c47e01c9d2f5bed8ac7d9a6534ee2ba01adf983e6c7249ca646 +size 222310341 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_17.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b40970f0985a00dc0134e7a5165b699dacbccb4 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794cc547d0476f9aa2a823374b2e8877d46b91e9f727a45998f37d56d8b5df24 +size 736714952 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_20.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..91826d9d868cfc792e97fcc6259f7e99e2adfbbc --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13fb9b5d59a02186f96fa4ba2f167ffa4e010c9903d3fe05c171bf1d3c7a95f +size 736714952 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_24.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffceef8be3f7ef08b1e48e1ba2ab86ef949273ee --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e6f5e083152de92ba0595c09d269b8e82445958d12826b7ab89619bb23a7a1 +size 736714952 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_29.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d68866e29f88bc660fb7d6d093740377bde1936 --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2805f7e31e5f98d4ac1d52494db119c20351b6256cc97d74893c03497eee8aa4 +size 736714952 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_7.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfb44d03c0a89b4b99c6c6846ebac69b29729a6e --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf4b8b7c5ecd49bd8944770ed3678dda08f308f9bd3fcae4625ca3478f05466 +size 736712895 diff --git a/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_9.pt b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..008b7ced83a144b4f4221f82d8ee462bc2eb06bc --- /dev/null +++ b/mn-coding-uv-2e6-32k-ds-r1-1.5b-svd_muon-ulr2e-6-vlr2e-6-none-muonadamlr1e-6/global_step_160/actor/optim_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284540339965c19c133a24710b9eb3859a0baae89c2a81eb937730122bc9c3c5 +size 736712895