diff --git a/.gitattributes b/.gitattributes index 7128f1464aca0056ac2a1ac841324ec14f0fd234..b44f937e3c70e90949474d42b6684a3a1c1dd627 100644 --- a/.gitattributes +++ b/.gitattributes @@ -728,3 +728,66 @@ sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-19704/to sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-14778/tokenizer.json filter=lfs diff=lfs merge=lfs -text sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text +grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7be719ee152e224597a778e4d04ae713ec0926 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e882e92811d603b1d7c33169f0b025c4049b2669e537e66bb23bad26ea032be +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8757ea04e93fc3d0d99347b238fbf7678e593b3f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:032478a582980ef2c598efe75ad315499f6d42a4e32aa077084cb113a48b8a6e +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7f721af80dc8e14068d3c5f7344ccec05ba376f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4debf9dda4f462fe3511ec26606053718fedd02f09970b78403f90a11722f202 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7f03299f7784fa6f11504bfb65dd885cdbdeefb --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25086c52a71c82f8f2df859291ac870e7bfd87f70293e98d086e60d4317c1fda +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..557a162cb5ec787898845b65b3f29c29236738d8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8400c05d78a868f3fb8829167d16a485f84e33d77e8ca368f247247e86d506d2 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aaeb126e9d99257792a4aceba5d75f10383f475 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed6a42ed7e39af915d76774028325eb34053221e67cef08522b0dbf29e9360b +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6b93456ba93eb9e5aabb0624754dd4566dc3d0c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496dab5ac434081715cf9f19a53b79013cc1af9c13392f766b50c29fd432c14b +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..21f886a57c43800fe940a3b40c33f79ed1404359 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e32d69705c106a176d6d90a7526ca0aff0c53dbc698628dc24edbbcf855626f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f348ff430de3fc4237dca93e484cc35f3e382d2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3a5f9f9438f8d33e9a0b1045fb33356838f16c5979de475cb6db60f6920e9a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..72d6891780f9c0734e0eb0fdd980eeb92dc6a8cf --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04f2401e284b6d6c90d110756cf3afe8dec75b249400c865cf2376b9b319c4c +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0318fba87d722cd57fcfd4682498f3110c5c774 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5ab141ecb9251f7455208a1d7f9c99b1cfc57988cdfb86f11ef65655817a85 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..50e8f42b4158d0660d22e355f299055f8acd653d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:623d9cc8857f6fe5de0394fb47b498e3cd846748829ea9da03c995c8db951dd8 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5cb6a94c2487869db88bbbf984cfb4b7e4dd756d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63a212562315fa03da9928d36545a70960c3e9b92ff46463386489fd524b2ee +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..83abd9d8d93336f001dd5821d5f14028322abd52 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c77f1281f31768af4e25df89af97425bb99e7ca1c8e207f78ff7f6ba5957bcf +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..f555f2312aa9be3c5151517fdbcf83ca8e46d82a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71da3b020316f488e9841c0d5447d857215527a1303732558eb8b0d5dcf2da4b +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..82865a2408177cc8e0a9a5ba9c80d7025e0eb3ec --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a0b5bcfa1fd7883b7d3eaa51bc8bf12b62570765d047f46336d204932f169d +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..9640d48e0f036cdc7bf806a62e99a0d4903bcedd --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59236a094fbd4155468af539e1d001f6c83152d87694314e1728f9ed82fa161f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..54cf153f6659cdfbe3fa5abf516bce42511dcf1a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d19a19a1621e733f81299b50ee7e52464ab66cd11517f247062c3dc897bdc62 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba52efc90706a1fadb0e6e492f0dbc1e66e05654 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24e7ca248b81bb822afa3560fb61ce397c3061d8dfceeb6ebbdbe3c1a81414eb +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ff0419f3e1c0202b367cedf9b46255dd077060 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee67cf4314e0c7ccf5c81174590919078e9753aea37ae2797812a7d1a68c0ae2 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..6528cb881c1d1f236cb9878abe699e1e80f67895 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407f251a8ecbe7fda1229f6223cf007607a4c15dff3ec5c2ad574c3400d86d75 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..930f5b22db746ad74cec9077d78f2254cef51e4c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2353dc8a88e88a7841e663c0c899be9842606f89b006fc5bc99fedad4ce3f8c3 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..19c690ca04f74cfde0190fd97821085131e3fef7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9e1cc29e53955ff814da39132fcbf7befe00596ce55773da2c57ddebce732f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..995a8cb2efcf9d9f4cdd0440f9c0421b20d36202 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5edfe6d7cca9ca522c7a28c2b9b2eaf9fcc5d05da256709ba38b82a48de2086 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..317534874b9133aabd9352aa9e13eb20b586d41b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3dcd8c2b6bf0ce655b49030f55be8ae9ff340a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2fba107150e8764af2ede60cf0ecde71465c8088d8af01b08afe9f41a45138 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b02912ebe02c12a50d9c83c7f21ad6d4c8fe8833 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf32bbba4838d91a90a84eccb3ee5448194306672167b2592f52f0574eca0f49 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..22b27c08b6a06db34fad1df59e024c3537ff3bda --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1536138e373843f9832da972f066736eff132e58f7d5ad0977019fe93eeb414 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d0a3b153a6a2d066b34483dc00d9ae615f9893a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fdcf932b5458b87023d7a45c060420452d7a97a8b969889ebedd3cbddca1ba +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5d235d6b4e556a42a974d980b85530b71dd8ec3 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee90731ea0c0dd8f909335cf442242f60a5949e7f041ece4b7ac574989d9808a +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..36368e44910bff87ddd737997f65276fcc5d364a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcdaa2fcae3630e30810f59ba729304eb7be756e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75da0e1656a768eb7b28b613273eb13d782d7ca19af3cecd252cf86174381625 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c92021f706653a6b99c0f0a9a182bd2369fc95 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ad97008180864f0fbf5aeb018396bab33c7779ef7a0f5ea7d231555bf306ab +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..64c464da4923e255f31cd8eba4b7d4ddcb144828 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547b0d6f98d44f896382bf36cccc97565692b04e6e52dad6d7894cba3dddae49 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..88729c59c2f3197aabd74571bf47da2d43a9a8ff --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4cc99b2b92fdd880d55857d800a5da6eaea4caeab4e4912e83b93766408b141 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a4c56eac959f99e65b318140c18b86df2061de2b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b639ce196f3610e2eb3af39352fc8f21abf360311a3523f0fe91765f625f0ac +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6144a9489666c0a51927d3dd1ccd7e20587a05 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea6506fecbbc2ee9a78553cc1d3c62a976f52e1e4b6cc7c87dd907f2b762e8e +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ec11610c7cdd670691964271806b7517045f29f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dafb57a5906a5a3c0658b1a3d672a00caeb26d6e312e7f425e322ff93ea049 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..93bb2fc655a563b6e9d8cb5143e192a4dab1a335 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fccd139966bdfc2c5122badf94f37ae32361f5ec47d236b7e8f0093977dbd2 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f9a6dfbc0c7f41572f43e0154e0d007f129bbb6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b8e7de87d3952c7534ffdbef5304b5d85ba0819ed8084a72e21454f822aa364 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..223a4eb6e24e6849dbcdecd283b5cd544c802b12 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6efdcae557eb2602456e8128e670273c26455c6d92ea41cf72a17b7bca1434 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..df16cd77717cd7cc92bf339cca6c1b9d2fafcd2e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7a02c41da4bb78f1188d22bd86e7a48e495ce6eb0c0c3a02074902b56dfa17 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b6d99f29e6275de54008184b1b0e9d6266c2de --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911c1036b3a6ca1a25d873a19cd2a53a6cb9ce23ec077bb523a68d3f1da0c69a +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97df34d8d01feae5d3a0e7a1b34be7e5e82740cc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c013489c8e20d8542454683ba036c0fc1061e7c19cc3101615d7e157da508590 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..0276f73ed837457c42e3c50e67efb8c1954c26e7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28d8932700fcf65e3c6a85e3759bdd1c59595a91e14dabf054b1967225403af +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7dec3493909e792c31f1a236f8d5cf2738b1aafe --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73eba5bf78813d47246d763134eba9718317cb29d4aa512dd4ea19d0fef0171c +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..adc94a82eeba2aba119bafd780c35fde9b632bfc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58bec20d1d32125a3ca5cc442a2475d57119f6ffaa1a7f46c126a1c0a09ef65 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f777c2f671c43c3d4b74bf39c3f3559853572da --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4553df47428cd2185f21d7119b35bba5498ab2ab47b98eb42f4f1d453d1eb8ac +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a24bf63a4d055d763e5754a75e8d7d63ffe1db2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1028e5b3f624fde0eb55361b2a88ba91061dbb06c9c5cc1cede1cc259b0f5978 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92661e706dd76dd110724a659196165cd49a23a5 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da4b444341935bd8943f57310b2d448b1e7c6d81d709c7ca17001b8468e3c6e +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..19bfaa7be81aa321993119c59d6208a1220d572e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:874908755296f11c7abc05818d9159159d9a76b4ee80d48877612d229d33145c +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1bc9282fc50c749e538e94882f88ffb50079006 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bcdfa4c69103dff1a4ddd87255fae8636accc7e7ba53e084c6ab239ebfd009a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf427dd50985d8253138b9a5079168cf4abdde11 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10af2bba71873094675b15c200ed540fd24ad5d8ed2774cd8147308ced080ba9 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5149bb54d1790c9fc3e12c6e7835f1da7c0416cb --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9889d294fa3e43a33f6c0fa29bd58fae1605f05bf1b14cf40f3479726f4ef952 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..96094e089523a06b353bf856e90ce3695d9d1062 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36ff5b02ee4e50859f323aa94e729cb245cd73853c43bff4934fff383d47d4d +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..385bd4dee22c85a2993b4ea0d331eb1584c70710 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a9d1127bd89d02652438a9bffb9d087793f57e1b6c02616c860d9204513f476 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cbf118f88cfc34bfe433ba43b8fd3e8b94618ac --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5130cf59c31b25e411c992ab36eebe5d8ca1f0f5494cb56724f512c80a2c2368 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2048ed35b47f7c1e2e5d0f2a5119c2b36f09f42 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b987cd10b7c03b754e7575ea7bdde8be1beaad37001550ea4ed714d087a535 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..72323215d8442b3794c58a43625c76bff31066ef --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4423ce78a060c23ad80e35f48f1e156ca15ce7afee114cbc43ec1bb9e427d600 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..1237bf0a80d1bd1c43d3ef07d5153cb9d81c02f4 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e071dbd678827ff7c3aae0f5a8db237726bfa7fcc7ac64996df351b173d14948 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e5ad4da925d655396db6fd3157e9b4d77a4d33 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3003d44eab6ac4751dd988d046415d4328ca8170e33b8982c3623f026e539eee +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f5db9f1df1ae0efc3b2e21a3819bdefc7211dfb7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80e460a6ec4ace8231ada65c8422f35e82eabe11cd30150bd5521f9d37099a4 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf8a182841f1a30f27a04b50a36bfee6c89718ff --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b295394cda05aa7f0c75959846adaf7787599d3f57a72daf2aac475981f477a9 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..64126e035a1f043a1a2695cfd3f57560e25926c5 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64c0214be5e29e9202121f9c64173aed090584f18c3bc569467cf58919df082 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..565da74cf0518a30ee686422fc2e5bf06eade4c6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc4888d7fae239b4a904547f8772cd629dee6ad9f6c3ef2f388c6b8b140625c +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b89ef85eb4c549679c2dee1f42113fa27675cd48 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10f983e0eaa7122653a1d75acc2f7481e7cf7e702723d2fe4927220e770da3a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..29239fd6dd841094e05facd312a48486e812b2bc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d6bcab03d2532cab897fa32dae91c1e0c5f12cf637107a681c4e9e5a000fb4 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..926d3b33c4067c856776a607fd07b5572129c2c8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f9d2099f34590664144b861ab1e68ff639a6b9e565c5776b2a86139135b224 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cccc89323fc9d1f961c55e94235fe6a6aeba5009 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cdedffa1d7c00564aa0df1c55aa9542319de198e30406bf96ec00caa29d42b +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ce2b3ed2991fd8b43218dd2cac99bf9b6c228fc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5a5e0c5bd2d8714c43d9d5995dd8b3ae4f971744b069d1dfe107623187e44c +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..73a90ef66a86725d1a27bb05d455498b499b0aaf --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f536a77ecb5eb973a00af0836e7bf1ff3e2232d052fb95bc7742c4982056679 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6220853d84379b52dfa717127b066e768c7322ff --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbf4b42b574cd04df0c8942692dcec7760ba2cec35902b02683a2d532d75925 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a5870b95188645d59fb86bd90e31b3f8fa27ad6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f41a0c4edf2cf228c77e24994d078e827f5de46c8315ca87afac3018172331 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38d386f193de366c34a8b515bf93608084ddb2a7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c6d41419199ed2ad1a078e17610fb69dab046c5aa6abe8a1004bf4ac4db864 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab3515d129e4e52a4006edd5f9a1209cd0d5af5 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b54b20f9bc5ad979c64993014556920a4d51ecdd58ab08ee1722b62ce77332 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c0e14cb622d8261f3821323701685cdbfec493e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fdf8bc87fa5784d5db42ae823e66be8782009847532a691ed88a02a3f1e194 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5036804d656f3c7742f5d6ec2132278418b43dbe --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be0682b12a84dc162ae5d9c417506412198996e2fa05d02841ccbf0cf88f6f09 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..588cc746d0bdecd4bc12bd22474fbda19bbab1ad --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4302fa2bf68128bd91cea25691e000bbd4b7a1c2d288198b13a5157a1cffa9 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec66ffa9d84c1874167bfb4bdfa4f519a9a49ae3 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8b3e5dac7f5ac84d3f28c7861a0c807e712bef300152c520b8b552df32e2e5 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09a9a1dee0d0bfdf34cf5301f6ceba0406ea5aa9 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7eec9ea3105e5803d96e15a97134aeaa059f9a76fde512435c1239a551263aa +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7be77c267ab89730e28a02e37a951084c4b830 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23dd736694796846a513219a3940ce36932be29a65fb4f44f3275aa40cd00a30 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..1594a200b76b5f379a71d703b15c87f6e19767ea --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170730d4aa5de6a2add2ee371178225ec880ce10bf378de332f6f002f2160193 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..147656fb22d55e94ed6da50ff1649bbf129040a6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4d5ace3a9f71ac725b6fae38c3f8afed0b23f186de9c6f3edf3b22c3322547 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3a63ad0a28c24263fd0482a002b8acd2bcc57cea --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ade54307073800861fe183143aa323934b5c30f17d3d499b33ab3d2513eaaae +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a536e1805cdadac0d4252ccaf6312536e35ac0c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272c2188cf1a27718154b5463bb8e397c96cb61145ad6668647206d081ee9fa0 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..211471cef0c2a95473a73a1a87e70c9cbe452c26 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107f0062cfbe35c3159256f1de79c3c63370c01585101fbd7b22fb86986e0a69 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d181273ccb61cbd5a90d8d8df52fb243af14354 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ba4d8d6271d9d8fc03df46899f2d635a4fe1e918682076f178535e4cf6cc91 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0914a8217754182987fada1e81f190812c7be48 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff140929976127b7d5793b93e37b6cbc757f887965befdfdf8e0d4395210c96 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..b396ab1ee08615ba5f1b01d68bfb0731b6b418b2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368cfe327cecd6f6ea669ebf713f975f47d68a7846c26fe5a94b79909a3fb61c +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..718f5a631809b738aa8e9ae4af145e80ec7ba98b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b8d22745be08cc89e74f8791ab209a5f22e65a1f87fd2afcc507b9dbe4de5f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..86212a2d46d556c77510df8e3c73f4e0fe5f402b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a03fe4d9f5e900ba38b309433d5e533eb4b56095b62800fd445abd38f16147 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad7391e1d421e2d1c629c09cb2c2eaed5a2eb819 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8c5302cb8574ad449a7bcf1f2b464aeb3b65d9ec3b7e50bbbffa755b76a6b0 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b295035387af1c59b6350caf712762df51f441 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94cd437b1214a1b5b8a71f955aa4b649def59f83fd22ffee0e5d84f48bc91067 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..202495371ba20fce84c7e284b11b336949f2b470 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f4974942a04d30b89aa2bbea2d256afa35115c7a78c4b887b8fdba7f03f4cc +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..85a4a392fac616df73bac3e74650bb204947c33b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa155ebffb813e5c8ad93dbb2e9770b14540a0897f9ba4b92777e4a61c83885d +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3aef1b540fcc382b68d9dd30ebf330fdf58a80b2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:913a38cf6648db82f76f571e8c0f966fb8eb8302efd910aee7cd065bb8293b12 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb1ef2915ab85175d367c36c7dfc6d4c6a140228 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14377969c01a0ab0fbcf41d9d9440acbcf3687c3878b0a5be2ea88db0d54e1b4 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20cad37ef5c5d7c609628d65be8abdf1fa1ec675 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0abb996e9a4a549c84c677de328220e02b1080144ba4a516c263e4a8c8810002 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..28816b098d9bc6e3decd989dcfe855a3abe27d3c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5064f7f99c1527bf39b53c75dc31ac8f790aceaf7f4871761c0290debfc616d9 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d0608f34f323ec56d53fa471cbb51eabcd407a87 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284406fd7f9e0b716a8272559ca75cb0c4ceb7e74c42a5a94a76567f2a40f04c +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6d591025f5214000aa1cce5ec18dde96191d470 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f68b82eb636479e4bebb766020463d28c3ccb55a25466bf60c7ede6b3515bc +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc3cb9ca449e7415b9e4ec6021db27728577a9d0 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db1470f1ce6a9af91d4f70aa48df156ba1f2e1b21fecf12cfa9fbd303a2a55f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..db137e60c3e43fcb3a75bc9b412a4f8db0c4ab18 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e115aa770deb339dedc7c5ac8e98eb29b9331e879d146b8ca0a047e129873433 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cfac3ca24145ffa07893d11efad215f484a15525 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ab386b252f5edf21d90686ba21fa1a61a3c38ee85845013bbe670534beea79 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c80bd3f3c3e77d606314bd513e2bf0f2d191610 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e11afeea5c9aba33603e8d1533106025bbbddf73df6045a4ba0377b2f19c17 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..4fec6ee18404c32ddb0c136db80d950888b06b78 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec7162ad0a8ec3b4d8c081233fa6ee71025873538f3fcc4615adf23af46b892 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab7c0ff341f14395ad6cd0e15db68b6d8a3013a6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93250de9a30c6422217257f923e08e3caa444decdffcb831afbc00270a640069 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0b56718bff520c3a0f83561cfab470c14f954a7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620ffaedcfa2a265a4e5f23267da23859d7be788037cd2c8ae584f3206fcfeb3 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..703b803e8e91e1d0c16d7515e84fd6c809183c34 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c9ec46b64ee013ef85da509548a167c4b6711a8f98d8a337c000502a2b3143 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..093e7e4b7ff53832c53ce8f0618dfc8494ff5a67 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998f854a91507ceab9ded8c39b768e1855976bc4e79e1ed6486889355799fa9f +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e386cb55c275e874f74f394058da8b6ba4b0ce8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b12f0dd48df6700cec2007eaa6c372f5dea8c8bda0ca1fe3aa426e53bdfc9d +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d73f7699dc1783edb1bad336504ec9466536662a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da50742cd6995c66e4a0208fea077eaa357637e378f66e147905805e11bbc4d8 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..05c1030e6adf6a1d44a4f0a5e932194196b3d505 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62a5c99f5ac77160a92a87dfa814d1c6fa9c4caf2c849599ddd7dec4148a0610 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..92cca86c9c6f6cb40fd2dc2db3ce3607d8a79885 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9496e4bee607d904d2691ff9482452f94024e36a768a32b5720f31aab5ff54f +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..85848552e2fb127ac455c80d7e69d79033cfd038 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec752707b4a6f3e798e655c5f710e4657ddb3695bc1d8df359ab93ee98e6b85a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0b2778a1d2cc2c600336844c2141dd11ed6df4c4 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24cfa7f4daf735af11b9e6fadd71c32672f28d4c806e43744ef9f34f2a57abe5 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..601df5190badb8ca213be68de541f4baa89da98c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba75c482d2703a84a765f0b334db4ccdd4df94eccafe43a129337410d34cccd0 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a260379f2bc6a9d1a99c3239347f8a8fa4c94b6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e4f89948ad2afacc5fdd46a3f0f610b558d544af93670705a781778d798b2f +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..867643fa29f696854a99f9da0ba63abe0a5984b8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e82d0829faa12e57b038811787a011e608499a331407ba023e73c4ab0879e2a +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..09e2479a2b7ee8f683a04fcb3c72e36bffabce19 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c12c81b00ed288ec2109236e8bf0c6471c5d7e960e573390b70e4241e34195 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a844190f3e8cd76cef32a3c0934f191cc8fe9c9c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1150553fcfbdfae38f14b5c3f3fff50b2b1f7680e835423b0bc9c43554143d40 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5ce665cfba9e91cc42f782a1152ca330cb31365 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3d3ddb3c961df900faef8a0e2ae9f9d16375b377e91eec25d86c6ae5989f75 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..008b2dc25d74443d7e0b02288b254ef18ce76828 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2a60f1906f1b36a4e3b097452d2be2d1975a2821bcdaede3597940f0c3142b +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb012d4343ecb583e8d22c304fe0838ccd84c7b1 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e36a84c5f028ede3dda4d86ec0c8ff8e7e9eec112b8a4c1d9400d97f4b4bde +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f1bd2841219f8f93b5cd788819eb59866833e46 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402671482d75afbfa1e553f39ba373037b6c4e3b49cb4b25c888a3e2eb5f3372 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f0b561efa643e428b948648fa1d6ca45a15f397 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06fa0c88b9e51e9ce91c650da90d875a1d5c0223da20c015af8f574387ce7ac0 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d92698c207b68e81605754688d2706383a99590 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55ee0fd0c4ba7848900e9ecd5b36504d22357de383853ffd25e0a3a0c320e4b +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..32d1c1289f48ee512a656b1964223d263ac5f4c2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a9fb0f3fca61f4ccc4f8ebc8da85b39dd30016549c5563ff65726838734427 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9508a6a65c1c2f4ffa8b200a144be9ac739e75ee --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2eb8fbedf2622b763e36f591dbc0932487d1f828574657ea6843229286f53e +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8458aeec346f6da286ca0637440b902b78e5846e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb90747a87533ad5ce62d2ef56b1a35e891b771492feb7fd1493554c27c5253 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e5d5877de611042bb438bee313c9cc25fb92e4f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83ca00243cde342af265abe2202f94bdccb6d6359621d2c423a5d2d3234ffe5f +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..19241169bdddab1d0dc3970e2f5d680b6c468559 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4687eb56ed9d07720dd81d57e596cb37cdd96972d54f42cb7467ff842e2dbe48 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9228a12651c7e7e66cb60e1b92953ab15d5509e --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a205b330c15259116ad4d232c85a3b454bf5cc7e36eebd5382ef22e50bffff0 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..e15a377fe340448f39aedfde13fb4b8620d29432 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ca12131b8d1709deaca6ce00aedf524bc08b8d6c96832317ac56d2d08190ae +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4ba7947bc86b2ebc4e33b592e04da27b161f12 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c2943323563e42caaa1671e34ed2b9742b743a0a3042a5e9c0aebd9b65594b +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf4dff6d3da93764ae82c0f0b3416084a1c0f5b2 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d7aec6eda503262d27da50c405fae5a98a7184ad24f7d417b8de35d096e1ae +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9aebed8aaadad2d1a867379a4df2d0f2bbdf46 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7922911bfdd442d7a0cf91414186bc39712d891732f7f94707ac473900c3760b +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d32dda4ef818a47ba2a5b490aa643df5686a5e27 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb76e600fdbc7e9e41615108a184b14955fe04785e4e3ce00185b0bbaf6c28a6 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac8007172516e9676c177df7296af0563135879b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c1a3ce288ff2b88ade76f000b43f101367de039c27a21532ee5dc28abc8772 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a4cfc387c4fe8c6a4ef225a1aba6be6262535b7b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e92cd305248f59d5999039d86abc6abea96f2bbd91b33e782a4e6a09dac00e +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3436493dbb69ac93b0954db5493686c44ed2987 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354946768bde0e2291b96fcead2911c03be890bd1d9924fb4622062787ff7710 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d4bdfe98320fef2151d538487db21dba8d729d4 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3a2c2223ffc3cc10f934fbbc3929adfd19e36832cf9be185b199b097c1449f +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a83be13d908c2ffc9affe4d606f86bf3a2cd1ba --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e5ad4cc4ed883137e349be454fc2309315115cfc90a2a14c0b11b71da29f7d +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..b50d77a84ef88178aa30437a2669edfaeab8781c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a1355accd5a9a89a73e32514bffe591367be838c247ec51a028dcff277dec4 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab4707cdb8a0144d9ddaaf281c67f0519a9aec9b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db4f36e4e6b15429f9e877eafc6545b154249a4939c44e2dbef6420fd233027 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..74b4d7382c330f27e06b136b75f273dc5987b00b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15c207f5e268fcad4ba2161c29afb6438abdf8a902f5d9bbf64133e5066e784 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c721ae801c3f4b774b4ffda5ce9ef2eabaf6dc1 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c31d72d622ba088645fb7df75c0aa263c650e5177b2d11652737191c2ade73 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e105b5e7492892caa63e3c912d5b1da45bb5d5b4 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092f000a36ff29c1c270fb06b28ddf75d23953e53e4d3d105fbc9b72ae775316 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..0774f415bf457c751f179ea34aaf5b58cd4741ab --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130935a882242938f1a4deb8ef88efba919ae14f9fcf8e65792ec7ae2f7cd28c +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea64a8c00233fd7c02bae2b24fe6bfc85624d77f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfc3586f4c90a26eeb5a4e95f46f5a0e9081c9707aa160cbfce164ce193f436 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a95513c0a6d06417a41d1a0b813ed4c5b161756 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd392876c4c7ac2ab25cc7e5a285595dfa2d7339afeed264555d59a79279260 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0994354129cb0de7236e36a9aaa10c47eb6eb2de --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28afec868183c1a4f186d6afeb5f23e677c0102abaa9174946118ba09f528a2 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..043faa0e42da99e35ca9870070523ecb7236d15b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0542277bd717072f3424835ae32d436c6ea860ea6577dd1b95d3d0f3d1bf5c +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc544990b488fd719f61fd972352ee319bc8856b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0717f012615bb939ee7a646d70477d3d009559d361e5972b31eff8482d178d0 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f26a19400af6f00fe6442f640d1e7da5d92cc36 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef0e9d36db43685e54af106c38e5eb35c6621bb2d1104a323c2a4d2c64704329 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..78d1d35b81c3a297f5f7f749b450e38bbf0048c0 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4d9b9dd8b0a0f347fdf1fad6e43c426939f9da40912e2b502329aae03b3a6e +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc57ea0121db75e25b01f3e7ad4283daa5d33eb0 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb3e5cb2c6efd08bc1fab626304617129d598d6c5affd24971f6c68f3aadfef +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2229de27c703905018d1c72dcee7f938596d7b80 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88adf94d0d4807e3ccd0e8e1e1c401bdd59ac42e8c033d8f483ccd5e6cc74948 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..df521209a61e47c90eb382e0e52ce0ea0fc207f1 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7db3339939b6e3b2723d5524b4b8f0fc861bf749999156f307df333ef709577 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..354112180d0ec96e8fa28252cbca6ff1ae0e5a2d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b8493373a722c186aaf14d5369582b61650e44e81a6c028b9131437fb599c3 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..23dfe6a9691cb5aae8ae57b1c038ee8682d5e632 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e85749f275f2d445fe6ea01be0378b9c5fd9b3bb77d2cad48df4392dde7d64 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..bff986861286bbd893f025852a8de54234df82f8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7343e4ba23ecc2a6fbe2e8cea0accaa3621841f44bc9fef0d18884a04aca6d +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..fad11ffa30d44a0f0bba8b2294981b4d1f554827 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b377db38874e51acf31f8257565e0710b07d89fe63c7605e194b41132973bd +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2eab4d6d63cf8439e9cada131555c1a565f526f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0525262b753b65db98a6a262566fec0e96e01093b2ec25d0d0220960c91f143e +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..311c78f83f4d945da59112b617cc6a678d6eba5c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6f869d5336e484cee39586b18bc06a042d818065fcaf1a7aa321734a1355cb +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1fa6fa385c45f3219829b001a037817c0a2b8e03 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:064ed37b5f7be40e49794a8121cb02447c38035305afec4de800293a12d6533f +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55b3e5275c65c348b196b9daac93eabb7dcbcc8 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d77f5603effeda716910cb9cb30d6570b11ee830cd9fbd1e400ff57d7f5ed83 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d4269f412c53bf2693aea4939973a4d3b721ccfb --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5bf3e42fa662c494b18b9d1be5f26abef95d5920306fa99a5d3c2e3b9a102a7 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d5b80f9b10271e1b169389d8127d3bdd4cbb085 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe291048efb11074a8d49b1cb03081a77b9f19ff80abe5e60c6c4c582dfee866 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3252076a1bf5ab59f8220a140c2bd4a0facb2c50 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd9efe6589a35fc637f7c2e261d29fa0d80112b05faaae33441a5678570f8b8 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5f4698d665470153afcbd30013c7129ac87548b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31be5c567817d85f33ea39de4ef3e203167e641be020c2b3318a2f8decbc96b5 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c7f4711f1837e770b2f9d0db0bf192ae49973e3 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e8a344c7bea0f149886ab48212a7bd6dd5901817f729e2c24a4f63b7dc37ea3 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..75137b900f22bf6a5d134c64071a9e370345886a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64464425fbff4983bc14444eeee91dd3df8992b835ba0171de4699b9670ecfc2 +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..c2fa37bb53f3536610e96a0244cbad53411b1fa6 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fb28048ef89b1d82e0025460be64e2bdef9049c123b230a1b1ed2897d1ffee +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..3417ca5f8b78b4c637cb12b80d2f6ce689ee0619 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8198f55a54acdff7c95ee3894621736323a96bb9762d8f82b1cd6e756ad0a084 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2cca10aed775113a23e70b49d8bfb9d743c81512 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f4bf1438a955e5594efa4faee233ff3b23c3ab52facb288e462bb7864b6e98a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b269e341de0c923951befd10cab7a9ef15af09d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eefa5bda3853f64754f2acae82c4b22c55796fb1ea51822e1c0a7f67fb86de0 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6f138164d8aa15f2261afe50de9fb81204af7db --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99fe72fa48519dcc788a57642812bb12b3fe91fde8b22884a15c919cd73f417 +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c03f7a6c1e815d12334002b3ff0457c378ae208 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621eeba37ba3a10516d637566502d3f849f23be26b0f3f43fa15fd53da0b372a +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff0d3de569f1f04707299448b071c39115b5bd71 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b25a73da3071ac84b807e99a3bbc3a0c109588d0e1fef6f151f592814842140 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..470d45d71bc48de00a06e05130c651a1f3a37517 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff895f5daafbc76efeccc3e1dd373f6dd6c88c8dcb270f0382ccfe42db0212a +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ed6710c9dedaf03c26798019588b1e4f3513d12 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be704873bf09ecc34636472e440526fdb1afd97660940c22f360d4d5d53ea830 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d991992f5982e37c14939d2da8f093b1825b87f --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59321707982695dd442e232eb36f4208166d2d1e690900c80c6810c0a15cd106 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/adapter_model.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60e8bc641e818f684d06d58fd97dcac71ccaa459 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1818e17d8c04d0b9e79b59e77a533e3c05b07aee1ba268df24be927553a94a4c +size 22056664 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/optimizer.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..041153e77fe7b20ff58f0ddac69a40e7c9a95920 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed479aeaaee539f0dbb71c74fb0e0cce5613f39f31853edd84e70fa2ac97e7de +size 33662330 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..097788f37db0b6eba92348725ebd3c1be9bf9cc0 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a359cbf24a90825c4d088a1ce1fafacac28183df4b02b6451d37eefee2795f8 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..407fb7997e122b0b46edfe5e3b1f7a787c7bd3b9 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2595db11e3c24b5f9d81dc96a29084859ce762683e837138c59ace106d47e15 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fcc56170ca5dad617642e03fc1cbe677f1b6077 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:902597ff9f4ddf085abbd8d2e9cc7b5128389ea0afb18cd4b5d0ca75e8e8f3c4 +size 14768 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..48abb65c227c2b31b456d54ddc8f0744547850f7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4026c342ea4ce8a065c907bea2b0316604be937451901152ccbb8d22d5546916 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..08ac16c37bd04cbfc3d79d052e43e2d0505ac29a --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97354df042b57754fe7f516d93895d4c1c23b3311c26953ea279c58a3f198e00 +size 6392 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/runs/Apr25_18-10-59_gcn136.local.snellius.surf.nl/events.out.tfevents.1745597530.gcn136.local.snellius.surf.nl.775809.0 b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/runs/Apr25_18-10-59_gcn136.local.snellius.surf.nl/events.out.tfevents.1745597530.gcn136.local.snellius.surf.nl.775809.0 new file mode 100644 index 0000000000000000000000000000000000000000..e186cd9f235c83c784bc544ef0c5026f3ee6e6dc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/runs/Apr25_18-10-59_gcn136.local.snellius.surf.nl/events.out.tfevents.1745597530.gcn136.local.snellius.surf.nl.775809.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89cf5656e98c59d11819b0c32e4dd6afef6c8ed960dd38dc2a44a7df5836557 +size 2466864 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_132107/runs/Apr20_13-21-07_lrdn2378.leonardo.local/events.out.tfevents.1745148103.lrdn2378.leonardo.local.2502777.0 b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_132107/runs/Apr20_13-21-07_lrdn2378.leonardo.local/events.out.tfevents.1745148103.lrdn2378.leonardo.local.2502777.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e2bde3eb4d9e4331eb1e9c05736cba7f37754cc --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_132107/runs/Apr20_13-21-07_lrdn2378.leonardo.local/events.out.tfevents.1745148103.lrdn2378.leonardo.local.2502777.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b92ae580954143bbf260abe707ae216fce46b8a1ef3e1ad6cabab8249c9587 +size 8529 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d12a9d2d071eeafa7698f4cba404127415223c46 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86aac596cd507b3f33861fea2995b839b40914ab6f589efb87c2f40cb027fc7c +size 1401735 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ceb034a917ab258609f75d2c178cdb54352599 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514679bdd452133d6e67a94099342f46839d3b0d20fa3ad129773368bfda520c +size 1401735 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb474858e21c05f05223fc228881e53fa6f96e2c --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b27452f380c728fdb46a4c8eb52de0929cf05d554e22f2895047cd86380727 +size 1401735 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b29c65c735b2f9b91d4303809f92f7b576bb31 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016521056b46bcc917b65fafc327d5d1d43ad9d409e22876d5627c9d32e60e63 +size 1401735 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00001-of-00004.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..525113c6258fda5395cb95717fc91ddb4b51b651 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a79bd330dc71781037f822328dc8872056f0f8db0a44155ac327969f1dbb565 +size 4991459544 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00002-of-00004.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1aa8ae4e417c9bba970a99b9f3740ac1c2cd586d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679518d38b004d441d42d9630429cfc5861b795ce5a32710983881055e075ec4 +size 4991757456 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00003-of-00004.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a2615cdd7141037c67e5fc2b0384810405dc743 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c98e8b3551c90ceb99d3fb675aed286d4cd349ebe08a48dc48d4619576b82ae5 +size 4947691960 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00004-of-00004.safetensors b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00004-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b1422ca2dfd72536b0cf93c3c5948f8819438d5d --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1be8230528c92cf9b94745c1a6c6fe8e5976cd515657ed177d7333129d1adde7 +size 1863387424 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_0.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c287de26f76b389db025ad109f0595b0b77fd22 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92cc13315f24c28015d695b6cde08bb1cd6fea4cbc435998485ed6fbe4c91285 +size 15024 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_1.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a650912080f22db0d79c6b787d62e9fc2cf473bb --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93534a5e1a72750a0a250a8b7f453be2d25abf03a7ddd59220f8f95670323176 +size 14960 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_2.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..747c72054d13f1c91ff62e95009fbd8998b69be0 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e7056d80551f130219ac8e710c1cdaf71949805baf2be9ab493dd3954bd3dc +size 14960 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_3.pth b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..89060acb72d5f33517c24eb175a50ba32deb06b7 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8397bc9f57009902c93d0bfa319f443b7a6a2750655aed7855a65b89b3276701 +size 15024 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/scheduler.pt b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a614bf26e29e6b435acab2087be8cc319dfa89 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6abfe1ebe766137f3680f6508999c257cfee4711cea22be1e9fb282530139656 +size 1064 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/training_args.bin b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd1ab3bdd69921a77e7c9beafb58be7574220b00 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47039f16d5275d9ea3ada3298d78b5a1de72278807641f20e607be1594f4afc8 +size 7736 diff --git a/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/runs/Apr20_14-12-56_lrdn0904.leonardo.local/events.out.tfevents.1745151214.lrdn0904.leonardo.local.2838705.0 b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/runs/Apr20_14-12-56_lrdn0904.leonardo.local/events.out.tfevents.1745151214.lrdn0904.leonardo.local.2838705.0 new file mode 100644 index 0000000000000000000000000000000000000000..9f353a634f26bf81dec9d9cd1848168c1c7f59a4 --- /dev/null +++ b/grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/runs/Apr20_14-12-56_lrdn0904.leonardo.local/events.out.tfevents.1745151214.lrdn0904.leonardo.local.2838705.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee789b88212f243b1d31a218fb7445e17844b48b4dcd02c577e2d08227c8589 +size 33448 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe44a65ad058bf522544ae1fc61eaa183dc6b507 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d281727506e34f69fdf0acf5c8df13bd3d5156fab97568d1a315b00bb1148410 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a86e1331c824b772b6b1e7bfc1abf0fdb608b7d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7484022fc605819a5c5aa68e52666b6e25c7864b030837c1a8db15d4cf39b10e +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bacaa9a62fd29faec786aec512726beb4ded617b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63018224e70960487b29d8732799e76a76cdca081b662ec4b2216960b2e3817e +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1137e6abcd20f39ee26da2758f71a64a02fb66ed --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688186ec119407153b462ea2d2ec4db627d4b86058c7ead07a434e632d0a88f0 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e0de7512d7635f4c1fc06dfbb1ec679820b763 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995da8d56d8e4aa24bafacf5ef337d7f391cde40d5dabc6add286e8ecf094b87 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6fc8febb29009a44247df5494a080357184c942 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac965a7d2bf38f9a7dca25f3285578da981c5238e429f902a78401d848dad910 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b898016ee8efbc1281e5088060ac50ed5afc81de --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815bcea5543594c6a9b563dd2865cd107740fdc42f3fe2871cb88c982f0f4ecf +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e51f4d2c13492df8e8def6f6fea72839fb59096 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f15177a911df448f2f05d281893ff987c0f293627d6a64c6ad5a983759d663 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6452a0240433a4d62780e3fef8d245bf62674c1a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/global_step1048/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336b0de9c7d8ea24bf355c4e8317571a8ca53db0d78b56fc71d7de405e2188bb +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b768905d37025f07cde33a155dea41d88b601d4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e41755b91be7b46fe2c536d4e9fee3143438108ae2aebd8e138a5b82c3d8119a +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6bfa92375ded08076d747fa0b034e0a79c7d3817 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4364823e6303f0ac612e10804706c5b0349d4ceb26997ea100a0f3e076f3ef34 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..bd47cd5cfd87046491e7edad3bdc19f9f550b00d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6960a966f0a377c6f54934ac6e1eb3e0a8919cda45960fc1cce1c176c924563c +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e28f073a9f9bc3c3ca90300873d490ed7a467947 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00599e135d2d8ec2ca1373843bc34f4a74af0ff3745c0046f9710de6d1d49243 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..87fc5bab102ab62fecab1cbc584f3bf53bf97e4c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb4dd0edc5db109349393e9a3dc3c39f42877724cf7a618037de7c20692d3123 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c444f5fd8a118c5503fb4b023ca988f23c1fcf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a7cb79d432e745c61ae8f1d1940d7fda8cef7c706854ddb7ab7fad5e5b91bd +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9511fae334e669d762af17349a9775e8fe704628 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1310/global_step1310/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd55ce5bac1f6da1be73ce4ae67294ea32b00b19490e14a9aed3cba616c43354 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..489505328a0b80fe9b860c331b16542a804686f6 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39f3eb677abae7f5a79c594e9cfb089be231631c31a3611874816c58767081c1 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e34ffb2a190b41bf57bc7a8a5158a59f51eca5ce --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358431864cc56dff95487ad67f78f9b1a5c18eccc693602a20b5fa9acf60ac3d +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..895a044fcb5797b8ae5f3d61e8c08c023928b896 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b22e7154ba30c18fa128c9799aa2693e0f0937b0d748453cb2c2a80793b45a +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..968fc0ee5027d029c0c956f8b69600a2c0252792 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c20b620bbf920d954bf93c5d59ddac46da8d073e225b7a1aa2b823f0c3629d +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb37c9ca2a04927c21982e445ada98b9a8675da --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308037ec281f5cc9059c8f8caf21288e38df68640d4c5e21f79ed427ed9da698 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d34bcd2700cdd6683b7c979d3aff4ba1f64b9fbe --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324841cb4030552a9f6ada4e9a8c024405108ded71abfe3f86c3d0e0948e66f2 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4facef721b66b51032180a76d79a32164c8c5ac6 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94159a58e82445dd8e6991e8a00e55b341578b01db6daf5833f13dfa457433c2 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a902d642f8fde1c1a6f3cba5b4fd42d983d696c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1e46c0b8b3935895287447fe18bef45a7e3a25e1eb56b97c858b48daac07c7 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8854f49836fd4576892a10d3c2cf35e11cf7b3c5 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/global_step1572/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e09142da75c23aaa373dd2b3d0b9073a882e4482ca1697d05722ff13664410 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..cdf724c9fb53470bf116aefeafd35e8afb6e66d4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5a27fcfefc9ae5bc27112824b0e29c42f544f9ad26a368f265d7e8c0335f7a +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e9dbcaca59a05a642c9808289cd643151728c08d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89bfeccb994ecef50e9da873d1da179fc6761c200b39c8f66820b431312959f3 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7fde5ca65b9a00c7f11fbdc01d77f60304a6b37 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c8ddac2c1cc2cc638eb053fb625c5638f49c40d008f3eac5a4f6a5631e0056 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..9228cf98f328680fd9dd7df887f60cda4241c93f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb402e090acea2bd62a3fbe42397582fa4e418e066cb8e86a3264f0f73d50bd +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b06f783f8059aebf8d68138e75bfa46e628ae352 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d7d7c9d8e94eaa8ce9fc8d338a818a8de4035590658906dd497abd2e644db9 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..88924f373d7607b41eebcc920dbaa65d4071759b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee2e29a49c0d634ca5eded4fcd6f2675888f5b40ee7d659cf6c6641d3e153f4 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75b6817b4c69880792bbc74f0a2e05b1ce167226 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1462563f1c2c05543af79f8f70aa2bb0aa54375d3d4ad118ba814ab42d44937e +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..906c9ddccc4767543a25d5e4e266602d4dc65df5 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00997ccace341d715077468955fb83a5f4afb026b720b820409cb80930c3d54b +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e110297a1f39f78494c781a3ba6dd211fb27d14 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b7f20e15e0111173b9d4d33574e64897a5b08d2d0edab98bdf905af2576660 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7656ec7da0d04ad1b28578d6717f5f78574ba58 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174cf0429f372839603c52349f7edc26ee1a18b2792fae6fca2fbd54dae25c78 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a995813e45314415614c5db81dc0fc9e0bd04b1e --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8026fd54d3a7f9f201b0b8f95127c00ac60e9a5c90585d2947868863f6e142 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..910948403f838a3f099e02a4ef7da6cc34181f76 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442a844b10856c1119c6cc1c28cb51fd2ff11a2392577782a2ac8f6301018b21 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9687cdd1d53eec5f61b820524b3d67adfc929d8a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e730a44201e0b63fcceec998c14c27dd9ee5ebfbc6708cea69e3831b2958c157 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f60ab67bcc04920f0a0c2b2819210e4538d334f8 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/global_step1834/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ef9f714bbf28526df8d29fd804e22fa553659dade414e5a77d9afa086cb760 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d1c158dbc9fd6613c586ab31768c021fe7db7a9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8632ba33a805b72550fdce4505b359b071cfcc2dd6417262fdc4ac589078ada7 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..09f912d0f0869ac7e634c30691817ffad549099f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d9f4ba2fea4443d0a091fa42ecf5b7375e218af289dc3b3359d3a4e37cea5e +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..21b52bf58292e3df416d8aa009e3392031bdf171 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5586d47814e59d16be026f561551c6e1eacd66e16e4461f81cd015c8e365aa19 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5373d12be69323a0aa7a057d74f50752ed175dc0 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e970cdc233e99739cd51dec49e4b503488a86d0dc5c09b716e8c918434ab0a +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..10aab41085ed6bd1a5f62282d66cd68d7d3f3d25 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b34a8786430a32f6199720b54ffc88bb0ba099d3bd8a154c5e46d2745a8875 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d26f02b412372d734f82037d6ff0439dc753fcdd --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c59cbe361d922f609c3dadac3e8d352009f875112dc0922155e2530d55ca3eb +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd5528408c5fa0e49cd6ed3116e99836f19473c1 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1131bb39d8c80afa948b7ae6b36c6b397b86f81b6c5d72bf45f9896862ce7ed +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e3e74c1b68be0eb32e962adfa65796011295276 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b637a26286c3607f5743f09d0db314976570d510c878f16f981c57e0cb6106 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8645766c8fcc27ef020c11bc55cba4cea8dc893f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8b2d0da0c88c14b8f04b2b38a2679daa0a84cfdb042e9387616682a445a715 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3396c21f93332cf7089f25230793f988c807ef40 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b77df0c857c15c50c871e14c1379e7ee2ca726c588e784ec4ae628e3281e064 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74f83372692dce18392d38846d1bd61c067ba554 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4789c8dfaec5204b216501b16b661623f5fdd2d01cde29befe9f68011998d99 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4917757f5160c1c87b88bd9de00a1ec695b33f9a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:907b8d7b3c768697797cf83edaf09b56867672a1cdcb549dc08c2d4f3f206c96 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cfac500c2936ed78f0ca7c8bc95d77bdc845ae5 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa591dcd95a10d45f58531d06f405974d6a33da420af3668d16598e3cca942e +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0ce618e719a97b2e9fa8e5a0ebd6e89555fdbd4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/global_step2096/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf1f33dbeb8b887e143ea84b998ee3e166ca94650061ff66ed2107ab4222218 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d70d5260bbc6c2ff026b9ed683de536a9ea7531e --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7424f45a61d80d61f05bf12b2b22805e8017a97ffeebbec7a4aa7869c52c057 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1892f0c3a196d72526f0d7b51fbf499cdc7bd83b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8949af96e68dc4dff456ce61a9714bd86cf8aff701a643b567a44f0a80e1c5b2 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..b209c18e459329a57aaa13da357c316a05165b78 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83669f178652466715765a921152c689272df88eda8ab0f03c520c2f3f8d49ef +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5feda806f4f984b8d83f582dbddc6af41b9c1c7c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3fcd813493b2cc277f267235dda263795b44db9c637348862c948fff72ba079 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3d842942ac88aedd95e421634972c2ba03cbd8 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d4dabf0defb403b6f24329425fc771b5f3da77b0fd3e8ef787296dae06f463 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea9ee767bbec74fb34a36bcee599df7aa72aaebf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2bbd47c7fd19daf39ac0e911337245bbf312798bb3a336378e8d04bcb75a24 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9798a1622e714b9acbef23944590f02168796a71 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8c486f4cd3978109f66f59d53bc4b7de5a04aa432964dc4820fb8a3dd25815 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..446732d8a45f25c7f8fba1e7b6fb6070f12f2f10 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc1297c1b5d6673cf9d700d73e91040e7c671b43ee2c1ce7164bb0f3573af38 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7e30f1a1f24f6943bc061f5f7f4b07a5e76d80 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e59cb95ec0271387444664db31bdb1fb3e3ce35cd5c6f3508c241521d995cc +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd1c218135ae169ab5a54d361c46664ed78c4eed --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ea30baafe23b68d0327f103115c820d4e6be06000b4058e7e97e0d9c22532f +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6df0b898e41e412787a7e55194aea986a9608523 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a29edb9d6fbdc53a79b9d258b46504dec6778c7c3f5edfa5aac662b76d6e885 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bd8a0a1e5fdc26f5b614753ae3381259e4b188 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3099ef3507849de92a9cab5225e8aae775312c5cd25585ace105c8d28ab97379 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76e6ae983958d0b165e8834b635859e8a63aa7b5 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36eb117830014c03d712a2d7ba0ad67aed97a86ea5e51872c53b1e61fc1d8708 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c40ce24b18349624f1423e504e59079ebf79c91c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/global_step262/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3ebb1ad0d4dd1a3b2a7e66b27eba54b661d486743a33d8786637d3cd75ef5c +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9addb83a507c6380fea278d7fa9ff1286b1e426 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b599198461ae8d6eac59810aaab52bd29e2f693a4b9c739d6741cd1f99d293e +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..81e9cc86ccd7b4f6d7440294169caca2ea8837fb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756fa0acad991f39af28eb8742650ea022424065df3eee4722d429cedb411518 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d9513e78a2c3fa658896e652100b4522984bd98 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96955490c396c13c2ca6db6a389878af9ef5aa4ed69d3c75c4092d6340c23e03 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..7093e53538134e5c0e9ae5201cc37bbd03c77402 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dcdc26cf88f5a2e0bc60bb4b796b4308d821534d05223fcdb154cae92623a1d +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..97319d41ff4f5ec2986ff6e5c7373ff7f5e8d581 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29af60badc3245d9917bc3ea106d516bdbcda5d5e735376bc451fc8c577986a +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08e3db752f4a4e9df35d92780908358cf2a1a89f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5c4d043813fb621f1ed61c11fad8df9707ad2477552ed0b691b3b94fff7803 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b055cedc7486e93ac62a3e8d143526a40fe1bbb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb192097de326bd2d7995f61c9940c64921afd08d73bd6103d02fb80b28ae9a0 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5278ff5633f2f2a2142efe1775e368875f9a7a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd30978056cee0ff9c20b10c4d4dd43ff2258ec59d35619cd94d0e36386bd6ca +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42323e587cd5c83649a9645a69157621b9c76f4b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dacf812c3ea21fec0a917638c47be81199c0b0f2d08e87563f20dd2597a87dd +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78dffc49622af7887b77168af8b649fbaa5b91da --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4234a6e7f236b5ebe108d5a4ad83e9a12eff09ed976a9fdbd3ca065fcc1f9062 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab80a1e1eb6e530df88a0c33d71474ccd3922be --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe16af6a2470cc32b0e5e22184570edc3151559e37f5463b87b5605b98a1dba +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb9be28a339503714775e7588ba4e2ab428dcee --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88621f04dce406c3d03d8aa403d4070770e0af6e8573c4a5154632f876e1936 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c8d6467189d76cac0404d07698413501fdc4a9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bfd4e85e07d4a2dee2e0345fc5817487fce1fe2ce28a59eba175b0d05f12db +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..809fabbca09dfe3bf979d221a460784832c7e245 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/global_step3144/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda176789b635517eaf10fa2a8afb159526c667fd6cc835531b64d18555c1d57 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..d95eab56847a9e534ed2116d432e21814e7ed8fb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c63962675f7c791b87ce21912c9420a5a0f2c972ad4b94430a73d57b77aa95 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d1e34c4a40c88a00b046db9e2f08e3069558336 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e4741f3034d19d0cc42ff1ca28cc6b322963c0a9c4a649086521ab51770743 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea48fe1439ff9f282560c91b53b7f5432ee111f2 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6672a0225eaf4181d19c6f9fb35941efaa37752d21de72de8d2d32be12b41a +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..778fd07a44b3e245ce58e6fc10d692d57a68e6f9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a321e2088f41747d86dc9300db46b52650deefc5b4665626c99a63c271c4f985 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..59196bd8b37c7cdb95e34c9620f13d5fb804505f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe6d17c91697d3b300058b0ef287c5f3f8299a8fcc430ddf32b878953cd4b62 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d22fb2a639fe3b030b5ba197dbd9afd0e0dd3ac --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00b21ffee0c108d4fd87c85df2ca18b9d516167c4411126df34dba3ee1586ab +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1337b0ee36fb02ef06a0b10a79a2c66a5b1dca9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32094d20215a536b216ba5fb0744310d64a7e2ab3786610d58b784a2c06f840c +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d293dd8c9c5498777a0e3129f2535356d318d4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff6b9d55d0beb7a74a92492e46b734fc3ce7cea3254cfa8c840ce403ffc8f83 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6faefe15b61ea120018d587960a0dba73b64dc9b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3e4fa4602d90dd232e975499630d42bafc720aada0dd97b54d36beb2a5ad2e +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..948bb1b6696cf16db211b4be49c959138a0e5dbe --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:898b3181969d2fdf959d7bb6e34177953cbec601ff2d893e3a524d232a02da41 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..577e3584639361c1c9540b49f2603b25caa8577c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11319e7e4aa47e938713f8c7f17bc742b1584b35df089abc0bbbff31c679ba0c +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6a9e7e98ab90a07b6847063cf39294c9f52709 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973a5608c0babafd28d43e7d1a90cf808d45b9fa1f901776d6aed84904903cad +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8164ef8cbc315f27fcca82a9aa1ff76272db8413 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4444c210631380cdbcebcc7780591ae198a15e592af2243e16ba71d174267e +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c009cff17e650302047418c744713285f2abb97 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/global_step3668/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55102b2dfe4ef744f560256a3b3c1120b193af35ab17f0ab26f92cdd841c9518 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..57bcea9b92517e93765c059cf6df869e4e061f28 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57754ba138c0e60f453f439c63dd1ba9da398041b2ee73a8dc6aacb8379d5c4a +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..e2a8fec5bc40dd2d985e94bcbf80e1c3f0de393d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa0e5d676a24a1a8a1483437f2b9804b8acd8b8ffc7ef5e20257b63e8406054 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ad903bc471f0a994c5b975b24695684eaaabe41 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49f538ab0a95066de511de51f2ca8e9408a2a2445ed584ddc5f8b97cb6a02c9 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b51b0a4541fbc81f890fd129406135ad29e2bf3b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8a0111360eda94e2e8f93c9863f4cd9ad3335ba305277d4643f386b9c10a4f +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0c06fa595b84f57bc8f8649fb3930ea1dc2e4cb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21057f42c9723c5fada9789bf03845da3ea2f2101b9cdf553ec54993cba5dd56 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..15f7c5d8e2e2e03bb62acd69c99e27c257e8522d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd805f85a022aff7228758b7b0083d06980957c080448d2ba4c3dc74dd5676d8 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b621309100999c91f5ab26fd1696a4869647f6c8 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe0f39c83bbfc150b4499df959baa0b19e2c30608ed48b2d7b253b072bbf5b9c +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..112f903bd94ad5445965d6d6494022e846658a3d --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62a0cb74bd863b3c6923dfc444b86fea8c8d457b97498df9c884a716ce9b2c7 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92fc0ee1cc223ac9f019124bd5f979a23126e94e --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf0498ea50c9c0ed2c827c6603d1ae39e18091ce4ada0bc7c0b7b27db59dbb8 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2c720041952c0bd855a55e70b0a4e71ff59dfdf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f51500b93803500eba8416c0d7c579f23c279fbefb423e586472d7b2fca36f +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a482b5e2c8211b23244b10c653fbe52bf6496738 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f405fdcde7f16c8e172fcc6e2f115b490e6237659fe01577100cafab249007 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c71ef70006d80f766ef4c40f26194a0c351e91a4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9991a4fb89ead8baca737981ecee27242e947359ae8f4fe335718d2bba2fa8b7 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd9114f6cffcdbeb046f163910d49fca11094b8 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f620de17ae26c0e80bc62fc55611ce268cda6be223a329f391a176a80a5fd647 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a1d3ca2e044fe210c51f518a5602c929d6e0c4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/global_step3930/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef2951df6bad088b47a8b42794fea25c608d7aa4ac58f005af37e4ab7cd5937 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab71968a599b872f7265217c56b4280ecc273fdf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b70897be73f1fec385981b85252ddd38f45655695d11b814f445e8a408b2b5 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..508f9d3663433d4d3e1a2e420d7013845c6c627a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6339311fc18fafbeb0bb8a28e175b9b8df4ebb1adb804ab92e3a9bb1893dbb4 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3778dfa16230c2b3f9470284d5b148e86eb55778 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6759acd0cc606ee678ebcd05acbe63cbbbc543a4fcb7d8512b486f145b6a94 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..bef7bf03045cf51fdd4f3f2a578c2b5d792ae6c1 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631257e51ae47e8276c90c6e03afa53766f63cb73d47b5cc1d0efa267f2aabbc +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfd8b8a1f9b19fca5deef2d8dea4c8795a861592 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4baba68e5285be62a9bca653fc55ea29e17c06c81fb9bd3ba107943dcd7763ad +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a9ae5871232b6a6ee08ecdc2c1e229fe6efec77 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8122dea8e2f8a9b83c43610183a8a0c8df81fee428355099f4fc57b8a23a265b +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1b2c9d9ae333928de792e2cd3b7a8cc43f4975 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e844af6ea69ca0715da4d53ab902aa2b29ad0f66a3a2e4440c219161030f6408 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7996b4a4d0de701686f03fd5a42d290c0de6c21c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f3bf8b306322e01f4ddcb7c933a98f2875f9a27167852dc16a245a7b769983c +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f906f74f38c63a3789da9ad43bb8012ad803fc89 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97be4acef96b780b2895a982871654eed7d5ca129b6082c0d6cc0c90196d482a +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d4e2b1d2ce20729d6b7b15ce7d6ac5dda24ce1 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ef4667892fbba00f554a479382baad3bcdb68f865252af5e3b4c0ba146d0664 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d06de3cd690ff5d3a787379c49394a2f3a510641 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85528e75d4269deb3cbb8746b286f3166a8e8a09dbab61343b4caeb350294f6 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e380acaa40c73838d9eb5de1d5377ce071c049 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b07145b360dfa585a5c565b696bf29f48abd4b2388ed90d3a73eef2bd5e905 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cf8d01d81f8405a9927af38e7ab1afc5f65f654 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c152dda4ba334cedf0adb115212797389611298b68691a82e5e2ea34474bb642 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85d21b0e23696f1681b1ecb546ddc2c496a4d21 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/global_step4192/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f45eba084719a0ab829a68cbc3ec5058d02577dc86c729d112ce961ed591a96 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..91c3bc6705dc80f977586b6d6f0af7e33b1d25be --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b6b3eab258a45a8c93785552212f8ca229b85d34cdd2bc997ddbc4df58c497e +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..1882a95631f0a73fc74d9d43cd9bf208605ca567 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4370c868a915bd7592abfdadb4806a0cf67c2eac327f364ff284c0bee3db82b2 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..90dba40d385443b44416f0ab4886ec3847b730bb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16aa1a701d1b88fe49ee010672c49d1899aa30c210ff457ac3f799d1c728db7d +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..e209f5d961438d0100ac31ac4669481a055f5689 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a39254c5d867669ae2b49e07af169eae00eeea38213aa8636e9eec9a64b9f5 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..70011ef8f5bec20cb555f1a3b9ce9630319dc3b4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad450c9932934853a1bbbf07e32c5925a3ed0cfa8ac0c8a3ca2f736fa64c3974 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d94bcb64e87c73c64f4e68301e61d49eda4d73ba --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fedafaaf0e920d2eb2b669bbe57d8e468d437a061da8195a0ee19f8314d8a49 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f95aeee5e004bb4c37b4853c3e94324b97fefb --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376daf4ba1ed9be04e5d7c5ffa167b156547f6bac24cd8f4298e560f225a7800 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..474b0785e666d9d92cb03e19b492dad62f16b257 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042272f1711093b942b81e22fe2ad76d13d659fc42e5a149726af40f542cb831 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e85e5e10436e1a484c5bb76fab5b19faca44b16 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ca3c2ebda136a4f1e67d49c80d1f9ab4119004c352606a9712024fdfd18d56 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adbd85dd99b94023ecdfcf3f800fab058296f974 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b519e750172b61c50d69fbd45731e57a6c728e70d9d9be19677d348c10419a9 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad586685dda937bc0b3f591a3dc8d49dc33f0f9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34adeba61bf335be02edbdf43c5a7470a12e8c489fc7d2d42e8fcf81452e6021 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd49e8ddf0337e94d103ec84741f9b9bc27e8bf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b815b75a6c1def0997e3b9ff8eb55e6ad11be8985342529231d6f2bb3c336f +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabd14296166fd1cf3288173b73cee5e2a176a1b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f82303ee2dc9f1e2477e622a25017183d15a410df8dc91a48019db94d54b29 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82e7c93745058029f51436a8c15fe45d77990d23 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/global_step4454/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe3c0210f0b12a4aea8bbec1208f31613e11787f54baf548baa5b0333ffb756 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..752d9d6639d9681c4ab742f423bd12d2fdd6e391 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378df17dc48e0aac769ad21d4e20338c74b99922180a7e18e2c963717bf7228b +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..109e04b706fcf5c5f49993b87d419e234a2f6265 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47f9e0f7dc2015afbfd1a294bb247daeee776f20435210e8eaa00bd59bc4d92 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4f0d4c1e66428b23b36a964d959e4b77c1b02a3 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef7a69a10f91c255905b4058d92d0f9af40a70b94fe9bd706ae57e1350b5eeb +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a0013f5412cc6ce36414154d7c0180c5aaf6f1b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc41c3ffc7c154d26b2fc77b7ce6ed896adaad91e1b9a3d6815fa1bfb485276 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1afe22f128d779f7bbc0072f3dc11edfe65d7cbf --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12735d7677c78ea5d84b503cb53e059dde4474f349faefffe7e1f8bfab1f15c4 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55d4a42cd04fbae79026432faa3182efdc1acb0f --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10df1de813852e9ea3f7e5da7e587ae35ab58bd926aa2dcce1741f705706a4a6 +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbaa50748f2d3b57414aded674e87a00df92b684 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07df8e877ba6c77634d6ab828a6c1cc002d81cce5c30d1dee2d74eba96b51ec2 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a7f458d2724732a424d7628ed7db46d23c9d09 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db28d86de06278c71bb987610b51505f7d1f9e6e70b007f6d02de3dd051ee099 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f3d32f3554b383b88669dc45b0e8d3368d3500 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7288c117208ff74821faead07b53148a4bb675af9e49846a7be8700732629600 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f28a5cc665806f75a9973b4db80f55dbc08d8bca --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8499706c103a611f23209541985d062f0726ddc4e9f38d92da1f6f274676c1 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb8576f7e5260c2d5e56ac6e26d19b37eea2dd9 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332b2120a9c426b00e833b25ba5fcfff277d01c6ad593c48633afa3e2d835a2f +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35531afcf73e93e07c7dfdcbe1b71c562f4e59e7 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b06c5dd568beca798c1105b8945a00cf3f5f5dc1e2e658d3eb17c1a83fb239 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5f8cf04607f64f753f1a4eeb7483ed13d9d1ade --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c740a87182db932d0034c3d59d7530240e709d94a668e9cd15a95d05569a054a +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744e014a7bc9921b55a6eed805dcc4be867fb5c4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/global_step524/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6fbf7f995b32a237adce510bb3b1caf6db818913e323bdaf365cbea870cd77 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..dd23f9c5a348c6209cb0e99eb894fa0f5c763fc7 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8c97a0bea876b9bdcc79294b8f49834eb65093e233a0b81ae778e590d130f0 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9c10582a318e02c3ba891659b193c2acbbe5cf3 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3376dedb666a0481ca2e901666957bcc43877acd4660c68d410049bb1e4b25c +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c19b9406a564034e68db0d41355940f22430236 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3233248285fcb8d254cc0927444ae9545be5ffa6c438ffa1bb79993e82cd90 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..630c2389374bb17de898f04d91d692585cf28ecd --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70686d61f2d6a94db3013a803000285ba94784012b0be23b867ebcd90a50dc18 +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/adapter_model.safetensors b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1c8a0cd7abd330c60bf836687b5262a2f8fccdd0 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05b29d47839dc8780b3c4a43af4d0aaec388266c17c2e7c8ab7f676dd1cc804e +size 11046672 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c853768e2a9d4cf454fe7789d2a83d3c8c278e35 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2192d27d805edcac38e3765692efba44bf104ce66f2bfc65b22393f7974073c9 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92b982f13858f71ae88ff7d5c39f75acae93a7b2 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470e12dfc4a89a3264979103f81a55e64a676d5c6a36bf413d467fff71812464 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf651e3f1931a16bd2ea7c79f27b6e31ca04f40 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2807fc27197f35de75182a2868a3425bc27b3aa1b9ff272e02b15674c6793a8 +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d48cc5dd88afc075d02971d6872a4017b373955a --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729af20ea29897b87d9635fba3bd4e08a9b050c887eb26045ee425d12a6cdeda +size 16518640 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb39d1fc56f5ce23db01fa279cf321943fa891b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b23067152eb00e04c331860174fd4c06c51a3965f86fdfa014224cd5f0f6dc6 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_1_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c5238f337201e03961fb23059e9b56d716d0eb4 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b568ef0e05d924b723bfa27d29c79e4d4bde41c6caa6b1ec7b1e344e986d0b +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c1212f073fdbe19076864250b6cc2b341c92be --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad200a852eadeb53d4be2362d31d06e407e9a0b02a8281a3ba4496dd197b616 +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_3_mp_rank_00_model_states.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b84692bff5a808bfed0ac3afcfdf37767f3115c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/global_step786/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1354d2ebb695a3992f1604dad7bd3130aebe808c8a0e09216b20c33d7d39cbd +size 321070 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_0.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..8810363fd4249adc52bb11ba330b7366df231fa0 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d8a790a233b0711726cd5f2b87e3411df6bf01319d60d21582456555c9acc3 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_1.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..baef0c59aed5baac51d93e5c2a766e3161b4593c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45620123e8d60f35e6a402867c90cab10daa407239cea4e335c089703e45185 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_2.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..967667b5ad19de0c46f3dcff605c001a3225d18c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c10314ed582e5daf366aea2753ff2c3288afa07c98cda471f2fe7189821527 +size 14960 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_3.pth b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..f149bc6c3dea9ad9759415277705af8390d90e7c --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95c537a58ae868b5c2fe9cfaa5e7b2de3fc00513f469e383cb554989fa100f5 +size 15024 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/scheduler.pt b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c324befc52f194c1ffa1af0b876f4888612277fe --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe2cc8512f9ae32d0ce8ad0d97b80867a00545e81e47379d990dae99d3ea83e +size 1064 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/training_args.bin b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..71a7a679bafd58fdbda78505d1846d457c53c968 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11053b058d5fdfbbeb42a2bffc040d300a12628fc29bcd3a89f97b09157f5c03 +size 7736 diff --git a/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/runs/Apr19_10-00-53_lrdn1381.leonardo.local/events.out.tfevents.1745049688.lrdn1381.leonardo.local.761986.0 b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/runs/Apr19_10-00-53_lrdn1381.leonardo.local/events.out.tfevents.1745049688.lrdn1381.leonardo.local.761986.0 new file mode 100644 index 0000000000000000000000000000000000000000..ac07307637248c958494f6027caec8752c50c7a7 --- /dev/null +++ b/grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/runs/Apr19_10-00-53_lrdn1381.leonardo.local/events.out.tfevents.1745049688.lrdn1381.leonardo.local.761986.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3ebd4fa5473a20f6803c96dffed12b54ea8842cb394e1f4b90a21ba029d5c0 +size 385493 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce42c1294970efb12349c60776026f63160815d5 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ace417abe2b1c38fd0047d00dcb5dc603c28674511c7cfe0e66591ea2c73e0a +size 1721799 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_2_mp_rank_00_model_states.pt b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac02bbdd435bfad89e0061d5a5e90bcc15a83ef9 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/global_step11200/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cdb144c5832409e54123575f6607a46a2ba1caa0d9e1d41a67aa2427192d6f4 +size 1721799 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00001-of-00004.safetensors b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4c06a92380b12073b2c2831e8eb2b657011b28a --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517d4d51e26529c2f67700838e2563955587be2174c2ac2850d0782ebf6e2940 +size 4991459544 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00002-of-00004.safetensors b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bebb6069f38a9dbb92a364edd96094aec87841f --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565f978022e491b20484ee6c746684fe5ee4e328107e7f5c91c8ede66edb3d55 +size 4991757456 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00003-of-00004.safetensors b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e15c926e4dc9295ff5b29ba7734b6774a5c4e922 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b207adbb9f89dd86204b48c41e80a1283f14665a530c600c867f8ef036a010 +size 4947691960 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00004-of-00004.safetensors b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00004-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c89c6aa0af57eb380eb00a60844791972836d67a --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4702e85f47e2b68d33702db96713bbd14c14e5809cb27d4b2988374d633c88f +size 1863387424 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_0.pth b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..54bafeb0c24c5a385f33584d0633ddc7c72a3033 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ad2cbc3c7a0fefa416ca212a3ca0c765342dd508d3b01b19c9bdea93628432 +size 14768 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_2.pth b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..847a12ac9891d16a30fe56837fecba87deed0f59 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5599955f9c18cf845e77f327ca171b5415ea5761828d42a4a50471361c2db5b3 +size 14768 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/scheduler.pt b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c31a6648152bf89761680ffdf09cd78cc839460c --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbb67c896f7c9966371ab3df11f6b75055ac39c3cad2d8156343fa3cb8a3013 +size 1064 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a7813a4db375020e06907094ac82c22e7c41667 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9cad5a9375fa7ef1f625ffe0493b51b845ea9275c532425bf4fc8b6957a7b0e +size 12030944 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/training_args.bin b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..68c636eb915576c7813d1fd429c5b86dadbd15a7 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bdecc5004a5f786527d887fe8b1d399febcf35d451ce22e6eeb5de5e46a4f75 +size 7928 diff --git a/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/runs/May15_01-13-58_gcn150.local.snellius.surf.nl/events.out.tfevents.1747264465.gcn150.local.snellius.surf.nl.1288853.0 b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/runs/May15_01-13-58_gcn150.local.snellius.surf.nl/events.out.tfevents.1747264465.gcn150.local.snellius.surf.nl.1288853.0 new file mode 100644 index 0000000000000000000000000000000000000000..cbe9362a548336260b0c74c91f7335b712befe27 --- /dev/null +++ b/grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/runs/May15_01-13-58_gcn150.local.snellius.surf.nl/events.out.tfevents.1747264465.gcn150.local.snellius.surf.nl.1288853.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cbcc408ad0950fd3101da5b7c00062bea83700789921c988a2624e5d6f2e591 +size 4311359 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_005211/runs/May16_00-52-18_gcn152.local.snellius.surf.nl/events.out.tfevents.1747349580.gcn152.local.snellius.surf.nl.1762909.0 b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_005211/runs/May16_00-52-18_gcn152.local.snellius.surf.nl/events.out.tfevents.1747349580.gcn152.local.snellius.surf.nl.1762909.0 new file mode 100644 index 0000000000000000000000000000000000000000..d25ba59d8db3147965a8491561690201cfb3ff25 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_005211/runs/May16_00-52-18_gcn152.local.snellius.surf.nl/events.out.tfevents.1747349580.gcn152.local.snellius.surf.nl.1762909.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4dc202e0aeccb23e4030057d421870051d4df6d5885261382650631c766fbdf +size 7049 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010308/runs/May16_01-03-12_gcn153.local.snellius.surf.nl/events.out.tfevents.1747350212.gcn153.local.snellius.surf.nl.4193441.0 b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010308/runs/May16_01-03-12_gcn153.local.snellius.surf.nl/events.out.tfevents.1747350212.gcn153.local.snellius.surf.nl.4193441.0 new file mode 100644 index 0000000000000000000000000000000000000000..e38c91eb04844fe85911630de362b9b3bfdea758 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010308/runs/May16_01-03-12_gcn153.local.snellius.surf.nl/events.out.tfevents.1747350212.gcn153.local.snellius.surf.nl.4193441.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72c5be33b3324a769d296ebfaae1a03fdd924cfccc5a1f04f56c9f8b842cfeb +size 13236 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/adapter_model.safetensors b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a851c3322b2a1f2da1c7698e2dd3d985ca016b1 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b11da30b95287bea795f6c044fae20dd4fb5061f128ce9a99e691b00184669 +size 11046672 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01880b4e29a710aaa807393a048a37f04ef8f8bf --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0147eb6e21e8bac045c69db8db1ec618a0e64ae885b179e55f0fac571c632950 +size 22025200 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c56361dca438d6b797c7d86c714b99eb994d86 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/global_step11200/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b2f64d602fa015cebad428fe1da8062a74081cbfa8e4f28f6637b30addf910 +size 321070 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/rng_state_0.pth b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..11e0c7bb6a08e8ff8b44a5913c6ad0bf80e5430a --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66dc0679732346767ba47dd1c35fca247ba234f38bb31e7c70d52c6f347d7ae9 +size 14768 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/scheduler.pt b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf615aee9eb7ee863c2bc3c7ec92f10afdbc8ad --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec15349e0092747ea9b4c650aecdb3ddfc48a0c13af980acaab7715a2001fd6 +size 1064 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..3061716ad76b796880bdd16b2292c0af65a5039b --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6 +size 12030943 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/training_args.bin b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..00a9ca485e85d2c806e26a315da1309ed54b3720 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569 +size 7928 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/scheduler.pt b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6d3c306208a9a829985422fceadb09cb64503a --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f93ad9509b8cd17e9b1cd5cc7712f9440a12d2eebe2b0670257940957c01c80 +size 1064 diff --git a/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/training_args.bin b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..00a9ca485e85d2c806e26a315da1309ed54b3720 --- /dev/null +++ b/grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-8400/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443b792ec5905e6302337c43bbf96699044effb11e28baca15b086682c014569 +size 7928 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca1f68f36c3dd45bccfbbd7b03a51d3b34b7a3ed --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d143466248a8974256ccde7ad285f092243b28432923fffb15acf52a53218d +size 1401735 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b2cc3f35595f0e6460ce1e6cc28e6ffcb77b0cc --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de265b4eefb945687c203fa66c2bd00c689ef9b38f938b1b9ba769197fae430 +size 1401735 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9fb1153540e8a98fcae8ec65d5c0e0facff07e2 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71d3257e92e8f02abbdc4a056eacf10d914a62457105b097ae85599e4092db0 +size 1401735 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68eb7306550adfaae24dfc2cfcaaca0d95f95068 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6216480853283e6591e6cc4bca0441cdd444722285423c01b587e8a4174e6027 +size 1401735 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bffb041ea5728576cb06dd1b0e836591149a9713 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545ce5712cfb8b4eb55cb89e0322c356dd3904e97b5ab4c6c2bd908eb6fc696c +size 4991459544 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..834cbd31f646e1e281cce6418b6d420e2ec3bb2c --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c9f3f04b1d52ffb17f4f7736d0011d97b4aedae8dd3136374a41333b268498 +size 4991757456 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5263b338c0dc576ec00c7615ef866de8bb7fa833 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5afd38278ffe53b784b75c6153b8d0e3b8d03b2903c02a4e66d98ae5871cb7 +size 4947691960 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..337e38a4b3b1be876192cf07782e2a024e8df983 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:312bdd650adc16275df4790b735614e9045a9ff1fe2999ce0bdfa6bd3152c106 +size 1863387424 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fc5a160cec57abb9b13c2a062c52fbe6a71e188 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659dc9beee437011295c32f0e369eeda66033d741de1417e5c2e725bc06993ec +size 15024 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c2c26948d72055c17d3b892b72d3b4d0c8aed3e --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c925f0a9be9f41bcc3e25304f638715b43d9d71ba9a923a2967fa95493f71ff5 +size 15024 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7bb27fc4f898b36bcb677974e2a3799953db489 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58973d261fdababb9058ec19e76a722c8f97e0726b50faa642ebbc0816eb205 +size 15024 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..763df6b57988b69897fa61ab7e082af10f237de9 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeed214d7c5bb3081fa4e35555f8aa33881b07fdd998350a014e5ea094188e22 +size 15024 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bbfa49057b862450cc54bc19ffbae41536bb7d1 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0763ca19f582c73f8ac88de5446dc1d84f3eed0e65f3995cdc9c4515ad0e123c +size 1064 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d56fc7112f02fbc010c67480f4a589c081c5f70 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a6f98e40b83d45bae017a84b509508bfd2def9bb3af3ef85642137413c0ff9 +size 7160 diff --git a/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr23_05-57-03_lrdn0487.leonardo.local/events.out.tfevents.1745380636.lrdn0487.leonardo.local.4094634.0 b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr23_05-57-03_lrdn0487.leonardo.local/events.out.tfevents.1745380636.lrdn0487.leonardo.local.4094634.0 new file mode 100644 index 0000000000000000000000000000000000000000..61bb9e1aba0385f4080c09dd8bd7ab43f24e8d61 --- /dev/null +++ b/sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr23_05-57-03_lrdn0487.leonardo.local/events.out.tfevents.1745380636.lrdn0487.leonardo.local.4094634.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c54c01281dd4d6af7dccbe4294a02ca480e4cc7f4abf3f073a9f1a277e1e49 +size 213414 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd236a7c858655fdbd904d2aa51ccf1d0bb4ee12 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2df1221c7eee291bae0984b5388b807a5126018f75bac6171e90e8267476bfb +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9d12a01943248ed728dd827887dbd14150f65d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff6787fde28cc4a5b2b7a347da31758bc33e8948c6638c0b412a1b03933567e +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..f06339ba5a1c04df9b76c67d49038662f5c53fe5 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379a4d804c655519454d3bad3d6da51f092a4e72d28ff9175e2c80c0ce59cad7 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d3fc253cb3c188738574b5b3aefcf87ad75b3a --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa17318d000e86d957c7daa06882178d9337e0e3fd9ab5f040f54eac9d9908ba +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c49844c82e78b7e396fa40f2f27a162dd6c8546 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26cecc5f5ce6d9a73e0b18698b1af8c5b39c4bda69c3f33d6703dcdeb91a67ac +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..efa9af7b917b16f48a792d3335c045b54f746f85 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4665f277f1ad371e958bf65d846d26c379cb52247b91a6d64034997e114f46 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca78ff4a15a59e8198e16d7e5287b23cdd4a294d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646f521696831b0d268d94af6f14ca70d8afd6520854e9bbce61958ccdbb016e +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c037e7007e1f8176734ac3acc61f2267ac801e --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74116744f34db02c4b4e74f5b35f2fd9774be4492bc9b024069032c2c4bb0ff +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af620901e180bb96dbbf7f2bd90ebafb5b8ed9d1 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb9cd49abe08cd7789a07876402864f684fc7bb3441d2a1c5adc98ba3c18506d +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..847a0d9649a6fd0fc0ebc4a2d735d1f5e7155641 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06edeaa9994ef176ee37972fab0846ed4cd916eb61a95086417391a4fde3d82e +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..91c945ed344d0aaef06035386122102a35633a15 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21a0f7b5b641ace0de10a97e3fa19c1c4e987a3877b0adf82b74da444b05abf +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3783efb4e7ce12f3d18d9ca84c3af84b52e1d6f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995abe18a2a0013d55eb7c0f47cfab48651d0c92276c5c36f3439d94930a2c3b +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61c94e64439c68ef463d77188a732fa18745ae2f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfbe5c9898f653cf801804d82b34ecc2fc66f8a2c3c7372d276a9fdee02be12 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b597fc06a38211d8d5c0c9726c6fb4c1e2e51d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b5fd881c125454e36cb9a36b3e87169bf8f54fe20967331c0ab0bb88836913 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..6826044138437956dff9dd7da65fc95999b0195a --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef3df68d396ef50658a75308e4bf3277bbfeb3946b849becccf926a1edefd28 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c53270ae55be6b75a7821d79da7e47600a2af5 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2dc17cb76f548c4df1240594283d0acd1d37f97fb0d831461092bd0ec8cee3 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-19956/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-19956/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-19956/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a3450769188add07fec3a24a70be57f1bdf44ec --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d35664825d668cc9d264f341af29ed46ab040533571868db845687b61b560e +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb5b0562152db64727bf7c81dd68cebcdff098e --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258f3aa00de3932117e63140cf2ef0fe9b3791317b7d43429a73eda013fdbb3e +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f8cc2dc595998af91190a0660ba13d993dfec79 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d880495218201956d89065c6c46a6391922386503464f34552a4fe387183ae4 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..6933173e9001d034317e0ad3fceb0e5565791177 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab4683572cca1ba8b2c362bbc37a0af93ea6855736f49c4e4a9adc362ce4f55 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..888d206b4827ce3e6f05223b06d2ce892cd1909f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4950cce067f8fa190c83cb8e4071bba0b2ac660f668f5e8fcee2578d66f19596 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b41d0bed51f2fcc6c195acc5ab7ce83e1b4b7df --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ebaf28d6349e9ef3a4b736a11ede8165bfc2f9a6df1e8bdac2b346835ac5af +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..55fe1cab1b919aa9e5512d8d07e40e43e7226723 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d596913e8efd88217611b4da09bbb6ee8f9090e204b399ff2d3c1d2cb33420 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d19322fe46837cc486b49d22d12ea059117e7f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc46787308b9d261488221ab0d13c7e93c42d2d42e6b10c56beb837ceb7be691 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d023f773be33fa8da555e0e229103988ad9b71f4 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c52e2bcc37f272872f1de95855f4a978d477f4a62acbebcf6c921183418ad8 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b93ebbe170dc228bd97cfc3e1d2948390b6ff3f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c6e07c71fe71f2142733970dfb42c2a54982f400239e19858bdda88e6cf2c70 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f55eaf3d626eec7622ab245b61b309645199148 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8726467cfae5c6b801f0f671b6051909cfb1a1be531cac767c5ac531533ecc +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c84285e39d6af914c214a036f26b37e697a4dde --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9aca3fb0a231d3f73e51ab10568348fe688e1fecf7478877ad6fbc0dc0e61a +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9f6dbba1bb3f37a3fd49a046f46ee806cc07768 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d560f311884efaf0bacdc693e4824343852f185b97c2845a098b8736b31f937 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe31a45f8f4846d930b6606dac12a5a5b2cddcd --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374b6075b4907af398199d7f6a08e0c783255cbcc957a23956100b24254c57d0 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b3993665864ceb3f81ba9cbd3a8094dfbcd37f2 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2ff28d42ace1cc286b6f66c7f2490331b7076c7bff74a535eec8fe52467a04 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f3b3ae65f49a442806dfa717dec80dc56cd3f1 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e4fc00adbdb52cba57771e6a9399b518b0e948b26a79251f704e509f35df0a +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5c1c94d4081ec3c2651c402c1ca62402e7ce3f5 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef93f4b0d54c879699b4154e2ac57c423f0a456bb7b67722f1dc3bce5649b0f +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a1463a744bb69c8c4732f9a29ae7a2219508ea --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5805691255aafe5e31f6cdfbddf77938762c5574d9855563f08ad90537f7b333 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..3bdb0e6fcca4da2702f565998c8e046115e131b1 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b349ee13a84107a2a288d704d09452783a528d4407cf9eb7d62b3dce5b1d6edd +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c8bc73f61f76e58160e9b05f5c83e5a6d9255d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4135a36c005434af323623ae03b1ea436bc66bacb79b28120ef3fc335d54eee9 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a480b725ae5a54f849d941ef7c017f1e1218033 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d232f3ae1753ea5871055f2a84d4620611c5b47a194f31379e6d0e6c176d71c +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..55ef2827be7944917757443a7b8488c4062a53d6 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec15c04f2e0a094c45e17073239ae110492a41c0d8dbe0a43a6ab1f936f7922 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0b023dd10a41786a1bc6f413afdc96ce6699c86 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c6abe04ebadd37899dbc1b428bb3ffa7fedddf4b4348af197f464dc8db2a85 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-51553/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..740ab3c0b2b89cbae9bceb84f4fc27a15ed70f30 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166d3576833f565794e7301f8b198e4a1cb3b769122e3f1ba6208dcb498edbb8 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aaeef5d247c4ee202c4b1d0b8354549883af076 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b76275c6c1b0d6e32a951dfb41b820ef359f3a523e701deb2cdd258a735c21 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad26bfad4a96030a7e569b39b8a108ba5c94ca8c --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da58feedbcccd3e68d4d1d2e75ffe94a977465bcf8e0c8feff90fef02df38328 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..b72bf5344fa5c9f91fd659d7c2ac2881c6e4b2ec --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e453ea97eae702c89349289bdda7cb3ee0c69f7a0d4d05a81d9250c15f64a8 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a631863c7d139facfe1ac72ec860d2e00fd872d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4a0640513ca2dd467a442e5b6fb63ca42e76bd057ed1d994f4b4ad5635c712 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..890576b4db18614528418c3ada2e3ed4b86e4359 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:392ec6e8515c2c275e3006be838859615de2bbe9ac12aa9d5f5ba13f5cbd4d88 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..d028356c403740abd92be13f295a9f9b24a4d6b5 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee599652580808262e2414d79d13f6e068ecc613791f614dafc1055150ad952 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3c8484ab24d80101f8a78c6e304a582b86df05 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7d2720eafb87876224361ca77f0e3340ad73ecf8a5b89d214662822df5b2f9 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae764b130a0ab06e3dffad09165ff74f874acb10 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183b86c18f5eafe25eef75ab13939aac1fce74033fdc0aeaa48f0d5c3c672bd3 +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44501ef94e692fefaa71de68b0fd983411a05aa --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab636aace078f12bd63b57bf386ba7b1e4da6140d9429d8142d19d64d62568f +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..e22403811ace4883bec3077bfbd5d85ef23d653f --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2b2794cca671992fa36b303281e17c3776874f8612c79edd6139b8508a8b55 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2298f20a12088c59df1c56f9fd474a50be01490 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123c98ee240c2334f014ba780a666898a15ca279f1df15c909b5d888070b33c2 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..706178c0a8d1ade864a996e511d77d8b8e99068e --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b29de2276075bbcb052fbf096856110ba9b104a210e8f40f34bfc111f2c3ab +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..271fba9f82eab0089d38b8a3936a759c87193a5d --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f76aa92ccddc7b62080641c68e31a4cb1a183569a2b89bacead848a0f1f0c0 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..554c44ede7210da700a1cb4bb3540d3b8180c990 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbf0602089d3dec81f5a843f1c6a7b4e23f6d809cb0482e367303c68a7be945 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..edd71dd5b0f8f02e4e9330c2e0caa5cbc96f98c0 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264dc091a3d31762e5bb1b64d389ade2091720849a4df5c30edadd72b7aef7d2 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/adapter_model.safetensors b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbeeb823408635b13ee6d26da884f43c8ac85eba --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b5bcf922b7f115ddc7b6dc67b61d4cbbd7e1e2161575d552b63ef3ffb35d4c +size 15367872 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/optimizer.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d095e2771d6a89629b57f84e60cd64bc648f461 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f49210b5d469b1d754ca9f0712952a139ca50fed0903d53a3ce31ebd2a8c24 +size 30872250 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/rng_state.pth b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..ada64148169d7d327b4fb3671ec3069e9a978d92 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8362fd66233d92cbe0c63ca103f1faef5f2fa203a3d3d896a970d59956838293 +size 14244 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/scheduler.pt b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..616c15df33d2acccc00ac684247836544eaecf7e --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653abbcd7366cf409f915437482f9d0bbc5d11facbf5414c77bec311ea4a7ab8 +size 1064 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/training_args.bin b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..40a5ebf39bfbbdd6fd02657c7618a5346a246f38 --- /dev/null +++ b/sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6681bcfaab168bb9f2546d08d7db7332c7031d07995e1b0c2370486b0ebaa67 +size 5880 diff --git a/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/optimizer.pt b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..d61f1989ba9b8a5a4936014a2360460791318f71 --- /dev/null +++ b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c6a9f2febe8da5565bddf1ad5ebdc418fffef75beba353391d582bebc8b9e2 +size 30872250 diff --git a/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/adapter_model.safetensors b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a285c1c982abf1f74ac82d17508db0b3fa8d917c --- /dev/null +++ b/sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ed7633febdfd24aca1c5b3593084bfc31ce9f43ce42be5bccad5e4c910beeb +size 15367872