diff --git a/.gitattributes b/.gitattributes index 22da35949fb21c4138240d5b5c724558a0b765be..a080f71f683b6339bcc5558d3f6f999917798118 100644 --- a/.gitattributes +++ b/.gitattributes @@ -44,3 +44,4 @@ mn-coding-adam-2e6-32k-ds-r1-1.5b-adamw-lr2e-6/global_step_100/actor/huggingface coding-adam-3e6-16k-ds-r1-1.5b-adamw-lr3e-6/global_step_80/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_300/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text mn-coding-adam-3e6-32k-ds-r1-1.5b-adamw-lr3e-6/global_step_340/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text +mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_0.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13987d6d9a9a5b02901450602890f78e40e3737e --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1dd7ee7f01f51666f49082c72e36b83d4ab8b6e5ee6561523a9b045cec422f +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_1.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..717a486038b38c9f94e0d320c24d5ed9542bc218 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96cbcf48d321ef8fe52221933081c988c5a92cee2d8461d29a1a64a5bd4e0279 +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_10.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a9c15df4f48f9c4b2556d3017a540cd048e5302 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43be47bd03d4f58376404353b0898d654473bfdbab5ff39954e66d94ad543790 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_12.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..620f6fb02b183149856620a7375b5f00b499ee5a --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c0f20c7c02154d47c463bc4792591f6ed47c94eff2d0bddba5be9f02089535 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_13.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f7ce154a14712652fc366cac58582a523860746 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b02335d8af967a694c406c21c62b5844ca597f093dcb8174b0d02b43a7bc1037 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_17.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..4722258b1f85dc0f001eb824bd469524cea3c58a --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b727faf4558a86827cd6f81401d0636b5a2d27728870408887c2919ee3bf395 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_18.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_18.pt new file mode 100644 index 0000000000000000000000000000000000000000..a48252ce174aabbc2eb3802a6b45528af13af77e --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_18.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:311cfd4309bed6fffa981ff90ddf4e9018f10e50e6328e43412cecf18d165ca8 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_19.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..706157ef10f6f16c96e79ee5bcf363130c750004 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694ff54a9b32da5b4eeea7b2d6840b4ceca0c4c7c485fc8bbaae7e2d703f9af8 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_22.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_22.pt new file mode 100644 index 0000000000000000000000000000000000000000..02a1812a7b37572ba5a73d75848e87552b4d98e0 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_22.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e486c28052f9a069da1894861b79c93e879a75ebf04d6f21fb449690e81af1 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_25.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed24ce7f27ca070e2784fe9a882169616c20082 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2c49a165ddb15168263a7763eb9957694b39afd39cd0bc39f7e46b4ef16cbf +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_26.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ac8e8ec4905b9fde292568ee91d3419ca046f2 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef250194cd450872db2ff565460235d9c3f2e1d27d5c90c79e470825bc4ed75 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_28.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_28.pt new file mode 100644 index 0000000000000000000000000000000000000000..56e2ea49165def76a7c14008ec1ecf4e06161bcf --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_28.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74404bd16986350a0f7f3e8b2ddf2103facbe1a36e72e915f9b841ea9cb9883b +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_29.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..099c32183a77351063d79db4a73caf2d0cb2002f --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b1eb6659d6d23fd35abe4d0276c9743ca7749c3040b7e5f8f06ec05a8ee335 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_31.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c0a7f9cb21f41b4e3c8b5c93eead72407365bc --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a4a02e861cee641c0266c8edb004f0ebff0310090a1ddbdf4e3a8614331914 +size 15093 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_4.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0552f6c2515b23f1500912f5bc69687d7528b50 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5196e25f825462ee92ca35ad0a27cd195b27f020fd7dcd9bff79306e241e765f +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_5.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..17e28d6eff40199c14d25cd326df8c28977c129a --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebaf8c18d653946def73b07880a13eef263f3ca70e2c729656d6996b214ed72 +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_6.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..b600934b758d53d3df26a4ad9b50ea6fea810474 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7afa34f2fc28ba77a40d60f944c30d17bf4ae4a3e8ccb4bb43180d42653b0efe +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_9.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c1de5675c0c7b08b7b4bd6df03f567bd0b931a --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/extra_state_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40297e63148004cc9cee9ca9ebb6fd13e33f958ee9e2254d444ab919fa2fce38 +size 15085 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1a2db243e47cbc113f6b2ddcc388aeeb8fe1a94c --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/huggingface/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893 +size 11422778 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_0.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbbb93679ec378bda31a783b0f50eeef026b08f1 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd390784c6c811539ae79ec0acbae1b80ac7c34575ef6c57eba2c6da5aceefc +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_1.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_1.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf9abdf8ea02ddd6cf4e09640388d17f1d242e6 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41684619ca9bdacdaa06fc94eeb9739517003a1429ee8329e1487147702f6d4b +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_10.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_10.pt new file mode 100644 index 0000000000000000000000000000000000000000..52d89dfd9bd0145c95b58002cd5ea876e4a53cc7 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_10.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728979783e4dd28b30b09b10617c86b778a6213ac63319f26cb654756938c2ad +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_11.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_11.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58ecbdfe1245ff1776c477abefa22c4f9c20e82 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_11.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628a9b748957e74400ece53eabf45bfb94bf70b5b4b8b493de448e74f97fc46d +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_12.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_12.pt new file mode 100644 index 0000000000000000000000000000000000000000..67c51f0fabe1fa864816d48800dd6eee53767f0b --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_12.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d0bf35e280d60ac10d53c35539520c4c5d01d4e6340b150a90722613d0d837 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_13.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_13.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4041ccd5e4007340ecb5a3234a412aca2b63b72 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_13.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d45ff1ee9af70cbeeab7ee2e0b0806c858bd7db2cc9aa08511dc890f3000b4 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_14.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_14.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3734279bbd944f588b3e4281b8ea1bc37c4795 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_14.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618b5015498b7cc155725b9e5fa8c4fdcc862ca689f47ba6e6d5413d7f3d3f41 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_16.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_16.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ddf73728c0e34a8ad3378b39fcd5596688c3fa --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_16.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2adc6db6bde7dde1c6fcc83a16eae2f5f6a0f834006b9dc44eb9c657a37e2c6c +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_17.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..77b07296fdf8f3a853cd4ccd2fd2f7b30eeb4d01 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c72724e344835341505f498c71d55dcb5458933e83e9faf59f069847692e76 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_19.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_19.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a881d56d8bcd98a82903a6e566305e0811697f2 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_19.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1820b1867507e31733a8a0fbd9eb565e443634b509c974ca0e0f6573600577e +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_20.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..847a9519837c64643b92c3ce73e7ef56cb9beaa4 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc5b629cd4b5c8b5757deda4a43f591883aac863b8062cbf95b07249939160f +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_21.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec59cb2eef75dea07e18addfe439e631fecca8a --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3394166150c2885791c8a2063305a56daee9d51d207cbad3646d77308b169489 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_22.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_22.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d0222275c28ac04ea36ce07ba52cf8bb21e311 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_22.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed979e92faaf810f46c39f1fd642f20212bf76ada3b366e7781bf07502bcdb7f +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_23.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c19af1efb8d1cbcd19e4f2838bcdc6245fcc6a6 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4afad8878aabd0de0d289112f6fdc3d0af8db8c0e08800bc29dc1274f82dd987 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_24.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45995fd5ca79d0bdeaa04155e36788e441156cf --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d51d847d4b75358f67aff0b6021e599f770a4cd098787f7ccca763a48823851 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_25.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_25.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2ea4d2f19713b03235c0a94b65784576bd7773f --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_25.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e695b99959e268ab593db8dd9372d1655e01e80d78334e48ff751b1f01aa7540 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_26.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbe16cd66a61a7ff135667ece94acae2b9ab94ce --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172cbb6d585a749542b69298a5db4a99cee2700c0d8fb4c2158225856e072c41 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_27.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_27.pt new file mode 100644 index 0000000000000000000000000000000000000000..3afae07dd4f6a8974989f0752d10ad77bf68fa6d --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_27.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb74a7ba49aa891ee4967c20da6ca41b630930f1b3c9e1540dd0faf37691faf +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_29.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_29.pt new file mode 100644 index 0000000000000000000000000000000000000000..0584aa4494b827142aa26230d0f62896cc5ef469 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_29.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb0a6ed8f13d32cba0041d5389714b0a7b6c863c95c383da63ea2197b158f97 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_30.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_30.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e5269329a60025b9595117037624d15b308caee --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_30.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f594e9e0408c156587e82ce7f2e95b3258a95b669a3309e7ee49ec8690e15e9 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_31.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_31.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4154a6c92a38a8db9551902528e4a2321b2374 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_31.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1f0ceb8782bfb8d8314983ed226fb7fc0d7648815172f8f585ce4d8b808ec1 +size 222310687 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_4.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_4.pt new file mode 100644 index 0000000000000000000000000000000000000000..8856464351ced71a0d73f55a149387395689a52b --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_4.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382abff4b803ff3302a19457f8e081a624399b24c1a6cc0d803a64cc56a080fc +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_6.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..92626bc16bee55189949bff4749dee94f4577fe9 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b28c06635e297d9671e01591807d1e40e730a92b87ad7fa94fea93f5dc601e52 +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_8.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf7a530fe12afd466e4b4b72887e1ea9cb740b4 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9fcde5abf16c9c9127328eeffba716e7d5286294689d1ec44f9b5dc44e6d0e +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_9.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_9.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ff1fad630e0dbeb26555c8c7677b97aa9b72cb --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/model_world_size_32_rank_9.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23855c8e9cf2f07cd98969c31f64e54abfe41a23e4bacfa609fb113ff1da787b +size 222310341 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_15.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_15.pt new file mode 100644 index 0000000000000000000000000000000000000000..a64f63e3ce5e1fa5b498c498bae7fb657315bae3 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_15.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e4a318dd41369d88614c29761a31dd55d59a46032cc32a374534e9537ff851 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_17.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_17.pt new file mode 100644 index 0000000000000000000000000000000000000000..b31d6efb298cea28963486127ceaffeeeb9b7158 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_17.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a1d305822d7a184a1e9f0a2178d6679a83d610d2eb73445dd974e9d1b8c7c9 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_20.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_20.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d1cb370bf144b2c544955f65051fefa4352d07 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_20.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5e3875af2ff2ce738fc7f2ee2b98889bcc15af551402c5ea58a7eaed3fb775 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_21.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_21.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ecf3fd4d24935eaabff8791b9599387cfe03513 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_21.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9080c0d87748fc6f1c283a41803895e8072316c5114c40525b6078618c2f2195 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_23.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_23.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8b59ceeb1ab30f65fb63c446eeec6f058f0aff --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_23.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39f8b1a9a9b244861c23af96e7c4229d11d01bf487c45c6d79c396069a7dbf0 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_24.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_24.pt new file mode 100644 index 0000000000000000000000000000000000000000..849eb76a9e8ed1fa2802c6c4bc1b0a17875123a1 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_24.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67298cc04e7140e7ba3459ee91d8101235cc54d060ad5fe99d48edeb287cc1e +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_26.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_26.pt new file mode 100644 index 0000000000000000000000000000000000000000..10cb3c8c3dfc0929f3674890d72257ca3c16cea3 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_26.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e695d27a72751d711918297da27e400ec9a6dcbf1c78773dbdceccf109915f39 +size 444753565 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_5.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_5.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe2e7a17a56797f8db7b258abdedfddc50f86ac1 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_5.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651c2a19f5e3636b04dab07a54b11c9d2f56880b730037d56bb7bca968f8fe8c +size 444752541 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_6.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_6.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e0805208cb9b98ba0ef0a3e7d9ea7774e0a9296 --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_6.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca4129c61ca73be9d08c73308925badb11f27254dd818ca13af7092eb3923fa +size 444752541 diff --git a/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_8.pt b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_8.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5bed4fd9e36a03f6c21d24a1e9d51c9781d38d --- /dev/null +++ b/mn-coding-adam-5e6-32k-ds-r1-1.5b-adamw-lr5e-6/global_step_240/actor/optim_world_size_32_rank_8.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e821044881dfa4de78c3fdc6d3ea19c2fd818f77e95c0fbea0d3fb5758e248b8 +size 444752541