diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_11.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..75aa2799ca13a9c98274a3d85c664289b7442ec2 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1819c832d2652c1dbf5cc5f362878bb07b25bf85d4b78c88adae0624d6e09822 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_13.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef481f7f3abd944e65c70ff709871d9d5642ff66 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387a5932d9dafe2e16b4be9f21f1ec87094e9432b79808e08f62351ff58331a9 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_14.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_14.pt new file mode 100644 index 0000000000000000000000000000000000000000..37602e7af7402674c4f2ddb91a146bc892da0ae8 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_14.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa9d1c5e70b57b7958ef212fb28a39cd6180bda887cd7f66ff8072c37558735 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_23.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10b6eb62b03b49539f66d0c17af5da9ca30821b --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0ef42a28e599e87b00c3d8aa4f52c72da5988b11aaf868255e8360953efd48 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_24.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..9171ecf128a60868dfb5578c24265b3d83c2f6d9 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67167b54ff775eba7105394effeaae6754fe5fb8cd97a52755cd15da5ea3d3ad +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_26.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec109f9c91d46f18d6c6739c6ed9871af48e3b5 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d2cde07b0854a8ba522b1f9db2fc3d6cc4400d8d43df39dc27f84d1ef241f8 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_28.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb2fe4f2fd765110c91947474277f6393bde407f --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:946303709024d434fddeb8aa1c0d1f8d9a1acd754f867d91900dc416a3ca5d75 +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_29.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..f72347df2ca409de70c73e119db8da8c9d42ad9d --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5abf40e340eab5fcb84249e7ad6aef605344e8adb513e104fecd5cb1ee344e +size 15093 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_3.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc8fb26b5670dd42e41aff6bb6464a88a43b971d --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5639b77b9d31c323a078e6c34214bb1e951e9928b3f642c07dd3cc226f71013 +size 15085 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_7.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..e026f425cf9206e20d4f4808afbd71f1d913cbe7 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/extra_state_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8607a8933f1adbfc325ed8d9473ace8078d8b8c84c0dce19f2553f5023d843e1 +size 15085 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_0.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..281bd1f4d442bbb300b90ae5309bb545322d3293 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f837123ae792a9220c77ccf00d34a215de36bc445066533491eb572278696c8 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_1.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f7f8f978ea27dffd247df750cde6a7059bdd025 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07fdf5e357abc3625a4b7cd9dd3937bddd855d1a67dd7cb4433abde8c6c0809 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_10.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc25619b13319f3829366c1b337064b79e517f5 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45ff51ffb09d9eb2a07e4bd8025373d5b3af6ff9f1dbaeb384017d0f813d613 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_16.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bba164f03cc488bc0e5565145e3ff891e9d1e7c --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd1c6e2c06fb2317b10a32e6bc2ac942a83a80c66b167aa0b8b4f7614c55f8f +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_18.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..9632b4413c8c52e14d14642fa6cb860d17b67b7c --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735b34c063fa85acf5d745c080afdb3870e887d30076d8e0567cd839537e8bdd +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_2.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_2.pt new file mode 100644 index 0000000000000000000000000000000000000000..a211a0271bc21c913965c9d82e193ad29bf8282a --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0b094d15c2bdac45bb06c89e1b30a38751aaaaa96eb2548ad8896dc837e766 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_20.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba400747ed36ece8d43002d05e3a5cf535a24686 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296ef5ed9933807c94e942ca02eac0314e1ebb06669a838be8bcaf7688168d88 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_21.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5c8f1cdde2ebb7d033b360ee4dc75b120e9e86 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de859ed047e28e31c1e19c8e4a605a83ab8000ab7ad1c50fc9b7108c7b2dc471 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_23.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..e090df418c7318f064756f9214c134f10a6917fc --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d7bc074af972523452433fe2af63a5ab57d13005112170822f20d2ca6340e7 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_24.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..05f9b510aa125a3437032e7558881ce5a9eb2679 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef77befad96c86b1bde9021eaa522ca4a87b29672ab880c07a119ba32450a28e +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_26.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2e8034de65ac079a9d5933ca8204ff62298ad7c --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404819aa22245dd2a7108fd26695b41865775db2de489eec74ce80441e087e37 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_27.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..4900d089a3ca27d96a0326bfbb2b21c0251608b8 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23e0f7b438f51283443111b6868a1f7c46e011612b576a5744ab2c193cf1881 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_28.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..63bbd4db0f9abb97433031e9c9dfb1d238efc19f --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46dd188e21e96e0818c8d56474d40b1eb93d0ee8195d0835e84ea475ca90627 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_29.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4850405472d6df3590f2c9a9ccd7408b5bd70f --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f583b61db0b21bcccc1f7fa841159d2ee318d31c2ababc801ce4fbaf6e037b86 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_3.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..884e21666f8e56e6b1352d07ac717b2fc7c70e36 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48dc480a2ebb43fdeb2386a621116e6302a5eb7d3f25e4ae9a4f1b7112b9592b +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_30.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_30.pt new file mode 100644 index 0000000000000000000000000000000000000000..951ddd25382f26b19b6cff71585f3a148e95d420 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_30.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b47ee4a85e699634e07264b9220cce5a6cff8930d4edc18a42c822a8c448f7 +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_31.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..f87c9e1e051553a87d0b80cb66926fe117a56b39 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e6bdc6f5a8feaceb38c6c97c6869bb6ce864aa9e34a0aa7c33b871e4ea9df1b +size 215237973 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_4.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..186247ca8b6d4331affabe3eb999b8f72bf6e678 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b429fea92818d26a13c3fff6a4d7bae886d8bdc3dab0b54191599eb83989d130 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_5.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c780686a5ad4e3957f8d02cda3d874a41b3ee9 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98d88b4147d61389a24ad40250e09f06c0c3f8634fbf80de7d7bd8627a0b2c0 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_6.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff578933cfefbc9b3544f0d5cb672c7dafb4cea8 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00faa03d538164d1a12e26c941930b0c5c9fd418abba74833d8478b2fa273d0c +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_8.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3f8b6eb62ef2b116aeb42a46cf0dcfdd31eed3f --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6653ac842bd696551f54c30dcec35cb37870b6244b832155dd3b2300dfa27b7e +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_9.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc65aa0e8aefe73b3eca689d8e1289f67b97270e --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/model_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87748f2ea0f7c02762a2472183ac5a7afc98f379989d5e5c2ed8ce190e9b8c03 +size 215237656 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_10.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb0c80f201bc7f192280f27630e7a5aa7738c52 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4177d980d44f9f5bb750c7b6db3af7536264f6e555eb92cf12137343f3a5abaa +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_12.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..d52366e9e25a389ba5b91e7ffd1bcc08567b051d --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3288f79e8aba3c7766f652d32ef66af5442df8125612a49fcb4c04605dba9a92 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_13.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..c71d247bcd8e6181e3e86fe164515df7601693ca --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c62eea4fe415b70f6310ba2503c5ec7a77bdfbdc124403dae4daa54fb63890 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_15.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..f75c659cb6e076edae3cdfb9561c7d0d546e4e23 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a39296f770b0344d10c2421353e88d46e5a9c5e28cec41c0cc6e31cc4c99f9 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_16.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..cedbc1139f50a837d7adb9b4310f606e4d253e5e --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d13bc144a821cf23e2d35b918ebe83499caf23921e51ebb682a8c5eda5a5c2 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_17.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f4f82625dce2e5bd21ecb585a51e2b074ba69a7 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5a809053bb7314e25928b12a631e62cc908f19e35c52943f5056af7e0f1548 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_18.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5434c9519738d02a9e3676d129ef45f5477e8f2 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59986cbd59fd0c7b17634adcaba0e6b91550f29ec1430ff9b65e8f7a46ea9e99 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_19.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..38bb08d6d3c159ea659bdc54f41feb84417a334a --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04affa953198d08149cfa3e04a133c32f74c3d45e6c2c8e292d7c5f2869863d3 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_2.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_2.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e903ae3b51d4d81b9f8e7819b49cd730011079 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_2.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c73748b65166ed2e92e7d0cfe7f299c512903040c8fc57dc47e10a64ce4675 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_22.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_22.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1813c284c88f9420e27080f0a8009778029ca9 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_22.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ae64d57ef3eeae20a525492315b6c5e5536ec375a4d32c494746c066bdb4ef +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_23.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84e9d18945a350e3cd85cf4c24a9cce60c95104 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0445152a12bb06f3062a705faeb063ae15359d9a93cbce502dd2d446ad59c8f1 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_24.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..72baa0b94bab80a33a23dcc8210423e33679bd56 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa7851555fcefef22fee701ee464f5cfefaeee7aade9c7c72133877720411e5 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_25.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..055f4cd7e73367cc1f26b9a14d2d3962db3041a5 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0ede2de807d4a550a1552a7b8c77105ec211356d5c35dff87a8befc36d582d +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_26.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..11152c514043b0558fade4de6b10e7b94f82e868 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b1ce52ac14c5b8d1e6b27ded2901671afafc777ce5c16284b13ddcf9c7355e +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_27.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..89ef4e4a6fbb8a6d01c07b6cb92d188f5d0fe560 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa0e22736f04f8d86af2ea0ea25b038c04e0d4f8c0f7139095afd1f28b94be82 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_29.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4dbc928648b46534beaf14dd9c428d07ca79863 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56988456a6829b50e4bb1129517e86993532273a091b751f767b3e45c2f1df10 +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_3.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_3.pt new file mode 100644 index 0000000000000000000000000000000000000000..2794d9d27dd44c1d25d2dd23c5430d3d2389271c --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_3.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456e3dacdaf1c73c160fe2d27688071d2d81e1557ab2e62b517f45dd09688d33 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_31.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..91dc194b288c06bdfc041c4eda6d3bc9d6cee292 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4519fbf576ae3f2cdbe8bd6390815a72473204def570b830b682d4d2f25a5b +size 430597037 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_4.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..526e7ba5e1e2f6fc0d6653fd7d0840f8ddb9ab4c --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d76acc6653e02c4a06f90acad2d0b6ea9f30c43bdc253366cc30f8ab4105fc +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_5.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace781f8c2ccecf05213d3a2d9d65feb0b459344 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a6fe0eea9e4b2a8b20881877057910814de9fce748c75ad39993c1b8e1b52f +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_6.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..de31924d054726ab4ae0e8ee5cb212b8a2b8a218 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1159114f2a93e2be442e34b04c415bc7e3463287f720b72dc3e7289e1587742 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_7.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_7.pt new file mode 100644 index 0000000000000000000000000000000000000000..07122fd37a8c4869636d4c1483982fd8d2e846a3 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_7.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0664e9fb21aafe1c4db9873ba6adf9cfcc096d5dd47ab9b90fe3c54e62eeb228 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_8.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe1111a334bccf360556957ed399d58b11b0b55 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b902bd817b1d11b518f366653d1f05ae5562bf93c1527c7476e809ab99237841 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_9.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..305ece6cff8c34ad85d9ec7cc8e5f6b1e61f3465 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/actor/optim_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa5fcde63f059224a7387d6b9a3db8520f5d636c9c2b37161f8ca6a081bc680 +size 430596100 diff --git a/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/data.pt b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/data.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6574e9a71c67488b87612fc140885f2f95b7910 --- /dev/null +++ b/mn-1.7b-adam-2e6-8k-qwen3-1.7b-base-adamw-lr2e-6-kl-losscoef0.001/global_step_40/data.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc1215807148fe96df96b51a8a295d034e408e3377b14419bfd623862af7b75 +size 1947