Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +63 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt +3 -0
- grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth +3 -0
.gitattributes
CHANGED
|
@@ -728,3 +728,66 @@ sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-19704/to
|
|
| 728 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 729 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-14778/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 730 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 728 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 729 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-14778/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 730 |
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 731 |
+
sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 732 |
+
sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 733 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 734 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 735 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 736 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 737 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 738 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 739 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 740 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 741 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 742 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 743 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 744 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 745 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 746 |
+
sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 747 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 748 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 749 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 750 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 751 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 752 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 753 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 754 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 755 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 756 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 757 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 758 |
+
grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 759 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 760 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 761 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 762 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 763 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 764 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 765 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 766 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 767 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 768 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 769 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 770 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 771 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 772 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 773 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 774 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 775 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 776 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 777 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 778 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 779 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 780 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 781 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 782 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 783 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 784 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 785 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 786 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 787 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 788 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 789 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 790 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 791 |
+
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 792 |
+
grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 793 |
+
grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e882e92811d603b1d7c33169f0b025c4049b2669e537e66bb23bad26ea032be
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:032478a582980ef2c598efe75ad315499f6d42a4e32aa077084cb113a48b8a6e
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4debf9dda4f462fe3511ec26606053718fedd02f09970b78403f90a11722f202
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25086c52a71c82f8f2df859291ac870e7bfd87f70293e98d086e60d4317c1fda
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8400c05d78a868f3fb8829167d16a485f84e33d77e8ca368f247247e86d506d2
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ed6a42ed7e39af915d76774028325eb34053221e67cef08522b0dbf29e9360b
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:496dab5ac434081715cf9f19a53b79013cc1af9c13392f766b50c29fd432c14b
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e32d69705c106a176d6d90a7526ca0aff0c53dbc698628dc24edbbcf855626f
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae3a5f9f9438f8d33e9a0b1045fb33356838f16c5979de475cb6db60f6920e9a
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c04f2401e284b6d6c90d110756cf3afe8dec75b249400c865cf2376b9b319c4c
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b5ab141ecb9251f7455208a1d7f9c99b1cfc57988cdfb86f11ef65655817a85
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:623d9cc8857f6fe5de0394fb47b498e3cd846748829ea9da03c995c8db951dd8
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c63a212562315fa03da9928d36545a70960c3e9b92ff46463386489fd524b2ee
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c77f1281f31768af4e25df89af97425bb99e7ca1c8e207f78ff7f6ba5957bcf
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71da3b020316f488e9841c0d5447d857215527a1303732558eb8b0d5dcf2da4b
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6a0b5bcfa1fd7883b7d3eaa51bc8bf12b62570765d047f46336d204932f169d
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59236a094fbd4155468af539e1d001f6c83152d87694314e1728f9ed82fa161f
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d19a19a1621e733f81299b50ee7e52464ab66cd11517f247062c3dc897bdc62
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24e7ca248b81bb822afa3560fb61ce397c3061d8dfceeb6ebbdbe3c1a81414eb
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee67cf4314e0c7ccf5c81174590919078e9753aea37ae2797812a7d1a68c0ae2
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:407f251a8ecbe7fda1229f6223cf007607a4c15dff3ec5c2ad574c3400d86d75
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2353dc8a88e88a7841e663c0c899be9842606f89b006fc5bc99fedad4ce3f8c3
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4e9e1cc29e53955ff814da39132fcbf7befe00596ce55773da2c57ddebce732f
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5edfe6d7cca9ca522c7a28c2b9b2eaf9fcc5d05da256709ba38b82a48de2086
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f2fba107150e8764af2ede60cf0ecde71465c8088d8af01b08afe9f41a45138
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf32bbba4838d91a90a84eccb3ee5448194306672167b2592f52f0574eca0f49
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1536138e373843f9832da972f066736eff132e58f7d5ad0977019fe93eeb414
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02fdcf932b5458b87023d7a45c060420452d7a97a8b969889ebedd3cbddca1ba
|
| 3 |
+
size 14768
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee90731ea0c0dd8f909335cf442242f60a5949e7f041ece4b7ac574989d9808a
|
| 3 |
+
size 1064
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
|
| 3 |
+
size 12030943
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
|
| 3 |
+
size 6392
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75da0e1656a768eb7b28b613273eb13d782d7ca19af3cecd252cf86174381625
|
| 3 |
+
size 22056664
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23ad97008180864f0fbf5aeb018396bab33c7779ef7a0f5ea7d231555bf306ab
|
| 3 |
+
size 33662330
|
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:547b0d6f98d44f896382bf36cccc97565692b04e6e52dad6d7894cba3dddae49
|
| 3 |
+
size 14768
|