diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_1.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..16c52babf4edfdeebe3ef8236e4b9a3dc32fb62b --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dda17c80d0d1e2c28c9c69a8ca1a1397291e226e6432e64514ecce59f0b3db +size 15149 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_10.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..3840048e86403b5affd2bda4b58ad943164ac8a7 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c162a865e4735957bc64534c4fe4325b82470a61c0debcd872f48244b203f3 +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_16.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8e02d6cf82b1af86ab9cdfa27dcc26fa46d353 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b8c4fb4ba99bcdbd1155a0ad46b5b913e05d896222eb1b8fa8e7c6b845e660 +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_20.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b123bd58d11249bec0e306deb3685f50914a1f6 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d5389a9d1143778a36dea869acde3ea863718dd15459bf89fa0ad5daeebc449 +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_23.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0f3daf4647aab3d548a2eafb6a2f2ef00f66698 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95157b1010406e0e7bb146780b4eea311da21299ca309d695a7ff7271b4931cd +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_25.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..801e9a2424c79d6ca2132f4a4094bbeb424bbf2e --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e07c8d3fe242f0ca3e222e061ef49c23581b6d1967d45ffeb75d6bb049016d +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_28.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..64debf9af0255e8607378dc72fb9cadfc7fb1a67 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047c4201354ec90427b5372ba83b30f97eefd0de68fb7a034c1f6c506dbe0891 +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_29.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c762d16793d3789851963f6c59cd814593f3649 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4b542323ca8a23f9501424fa9a77c27484c1a1cf1fb27f22078eab72bbbed5 +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_31.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..a83e43428215b7b9c642d09c53928df5116b347c --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c3ba3aff0dc316e0b946d62a127a29aa41ee9c5dac815bc997c6d37170985b +size 15157 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_5.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bfc2f0d33db39a6d73362b0005b1ced4b2745e5 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485d70cc037545602772141a3d13cba2d22ac11b1c9e24fc8d8bd6a39c635306 +size 15149 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_6.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..4516c0f8cbe935dc55f812650af19b12b752ceed --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e27fa775aeccb40dbe917d399890325d9bfb100f096edd274def16e1180a574 +size 15149 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_7.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5723472ba7023ef7b6c8b7c3879b8b59da2f599 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/extra_state_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45b60a4997f4e24a7d23264c5b1a598fa3f4fe1cda37e1316ee79e67c482b76 +size 15149 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_0.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c99ea47782559e3d524822cfc7d35c0b0e71531 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ed5782534158c717ebcdc940ae7c70454ad25502af3f36cb2c169aa8d500a4 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_1.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8dd23c08176093a593fa03494f110139109a11f --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c55c3484ce09ee74ae45f147c917471e5e0075e371c52f3fd0f097be547a3c9 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_10.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c7c64c90871e8dbedfa82f28d487b6898d3a91 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600f92f21e1231c2556df3bd3b84225777d9e26a7738803ba43655bb525125d8 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_11.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..80928108f8a796a5b548affb0cf4978828c15b55 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab41ec5102c70c8813e5c0c8c3bfb18e4ec2e9dd3a20f69dcfc59edf0d55db5 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_12.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..389244ef31ca4eb98e6f337c1ab996292075f9f0 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc92f22958a3930a5af3f2a9879a1b47fa1f6ef02e352a08e4c8197625c35da +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_13.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d62f7f11ca46ee87c2e073ae40053e29241733 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20055222bb47e74d8d1d442b7aeb02a883a6ef30ae59be7513860b887317c405 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_14.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_14.pt new file mode 100644 index 0000000000000000000000000000000000000000..6410e8add57d5c00e8deadb33ce3ec06551d07ec --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_14.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa73b180d47e71c96c439eddbcba7a8d380446bb4fbf71809fd2cd951988e36 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_15.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..a91c2feadf4138e337c3c5241418fb19c50f0b9f --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab5c274606a0a2b3d46d8c71e760efdfb14e55b64c3ce11c308510344a07867 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_16.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce192c5a8cff063028260dc789d95cca0ae67dd --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a73c0868bec1e8ac524dedad2acb521c512fa6c2d7f15c713d25d64bdf065b +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_17.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4975ee0fdccb05272a76d64aecc7851e8338a1d --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6936da2346e2ff3597d9be170682eb1c0b43c8f4766f65b524ffcc8a1234004e +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_18.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1f54505b830e832302f58681a834aea0fa15f5 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b49f59d4312ed9f9116c482a0e59347a9745d8c762db183d6784a3d233566cb +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_2.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_2.pt new file mode 100644 index 0000000000000000000000000000000000000000..22e48cd7e262eeca93471b9533efb42ddc954417 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2ce563e5aa59f3cdaaa5a30d7f32007459b963dee99884dfb50aec97789633 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_20.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5fda4fa1c554c5af42bbc3138205c939f44837a --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:018a6beacf99c4471e9e97ea6513d824b7f3f79d336c541c8ed8574f1d957a46 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_21.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf9bbeba36ff9fe342c0f88dbd7d02c710f88466 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf43e7eaf72e699a34c9bde5b4e94fb1a7b8c5b1800a47f51264388ebeaaf7bc +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_23.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e5faaaebde1c0ff97def3fbc291d50033baa63a --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d104d82e0a74b922981d9eb3dbbaa10b791fe1fdf8689bc557cf4f544e76969 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_24.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..73c3ba7badb27a003446ca1179c1e3cf63eb9d0c --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed35dc412fd7410e33cac4e25f89e259c927a89fd75a16dbd9cf67baf820dbc3 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_25.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b17e20b51b553a7931f7228bebf1f6d1cba095d --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce73de4f351c87b5384c740e5670cefd33ecdf5001cbda02ddd792674b7df83b +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_27.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..c83894410a72e2dbeffc7ca5c745cc686fbe7b11 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d772fb77de69bf6d41e5ae4ee6b243a488371e7c32f4d7983047a60e70208c +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_28.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..453b8b45690b9f0a0e01a45165065a7f35c53be1 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f726ea2c830e2e3d45e6bdb47604d83d8826493c532ecf7da302897ec5b404 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_29.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7222376f8cfd5fcbad630f6b4ca0082bef4a2a --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a53e1c02f46952ffcf5fb6c228b84e125e9e56dece3a106ec6aa3d55e0a38875 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_3.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49156463f44b8f1e135883673f970dd8dfd67d8 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f6711d2c3cbbb5bddaaaea18f10c020e2a79af16c5dbb968ace2d236933c8c +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_30.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_30.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be7dc75099b4a72322b3735d8cbd8b27895c413 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_30.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482f5e30fea1203001b02ec108c00d95e11f630100aeede916cc11064993c772 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_31.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f482bc69ccb21cf8d941cff926964433f893521 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79eb4385a55dfa54ef7ed7aebfdfe15865dbd07b0653aacfc03e4f6dec0ab459 +size 222310687 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_4.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..a694542d3474ebb1cb816baa3375c582cdb324d1 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8adb3333ddad4be1e4ab607d6f4552842bf83c81cc8ed65893c3aaa28f02581 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_5.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f91daac110326dc89bf894d33a7ff47af00973d --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab897e6f82936fd60581b175962383cd26e5dba916c3386677c3bac2fd38c55 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_6.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..207fe5ca56459466b0351d26db9b73ea3492ace3 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7c1a89faa975799ac491a9aacbefabe119f12ab588213b4f0eba6179b2b1ed +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_8.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..65db20b3d249158dc02799e8e9c42e9b69a596ff --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e323c6ba8d6b3f69b86405925ed9af1bbf53cbbc817cf3a331174d811158ca2 +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_9.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..1325d806c830d953c5b95a7df32341fdbb28eb0d --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/model_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c19ee0fce1cb6c81d7ccf8c550a269be565d6c62fbc9ff04a3d90370d9bf1d +size 222310341 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_0.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9d3bdc5e7a268b10697790bae65decf0fb990d5 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44adeaf2b1914a529287771086c18c992bede251a34327fe97ae4ccd579064fd +size 736724479 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_10.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d298ec7915cb2f8daf201e79208f6865ad4875f --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ccdb30726d27bfe6bcf201c84b45e772bf1140a3850eeedeba90ef3930c4458 +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_12.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..38148e52a143bd75ce88e75decbbaea27f96ecaf --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d9431d2b17246272ccd91a034ef8852918ef30b10e80bd587a2c86fd27a05e +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_13.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb02d8998bcb64a3db6651862b651e4430b82a0c --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ceb3cf324c69537aceba26e8312d21b9d3fae7b397651e5907d84d85f34e109 +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_15.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..26e8a45ab60f2bddb9bef0e9f8c08a9c7631559b --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc81f2daed30f97aadcd0732fd2f8298933a63ca09aa1833f80a526ef92d4563 +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_16.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..68b3f018cf52890f49f421b9a6d7cc0b50283bd6 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390a0c5d45df8a54724f919d594169b52a079f8d01a0499fe925fdf553d41b9c +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_17.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0c7d6b9edb5222043615fd01c3a982fb467871 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94465a10b916dfeab7b79df47c54f5b7152f03dbd74bb156a1e968b0ffa8f0ae +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_20.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..911c6e0fc01fb492f9da089a604ecb92d8f5413c --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47bf224204994cc0920a51c1868b3a4491c21e80cbe7700db66ec5250c6cb6a8 +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_24.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ac781f7df339fbaaefcdd23f03c2e9a7b33aadb --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ebac4b88c6aa3d51405010064c274fda58a062dcf7502169f27f6b84f921c1 +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_26.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..b02909a7f509f79d197ce3f1ff0430e2af1d27e9 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff5452baab57412c8e9c9e6e55e94aed356577661abd0e1a2b9e7924675b94f +size 736726536 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_4.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1be3a03875806da014475ee42321cbb525caed --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca70bbbca079630dd5c7c68a99243bfb3749120d81f3e4552e74656f336929b3 +size 736724479 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_6.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb950f430434a15c3b9b32ff3de5c163ecd14c71 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810966bbd51b1bbc75763346a5a6b87510cc5eb40b58527217e180bbf4c3c66e +size 736724479 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_7.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..f787e7aa07521f8cb31962172a6c2ee09ddb1fb7 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee10f8377408f4ad7bb656c2e1e30873b06854ecd0dfe3b44b501bccb3be834d +size 736724479 diff --git a/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_8.pt b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02f3f3eba7891666cf352c0ebb3b01ce8bfae11 --- /dev/null +++ b/mn-coding-uv-1e6-32k-ds-r1-1.5b-svd_muon-ulr1e-6-vlr1e-6-none-muonadamlr1e-6/global_step_280/actor/optim_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e04f2e51843a2e776d6b822eae41bd8863a431b660cd68f2e878e8d939a0c0 +size 736724479