gijs commited on
Commit
ea09d3b
·
verified ·
1 Parent(s): 3ae48b1

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +63 -0
  2. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors +3 -0
  3. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt +3 -0
  4. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth +3 -0
  5. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth +3 -0
  6. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth +3 -0
  7. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt +3 -0
  8. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json +3 -0
  9. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin +3 -0
  10. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors +3 -0
  11. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt +3 -0
  12. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth +3 -0
  13. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth +3 -0
  14. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth +3 -0
  15. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt +3 -0
  16. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json +3 -0
  17. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin +3 -0
  18. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors +3 -0
  19. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt +3 -0
  20. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth +3 -0
  21. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth +3 -0
  22. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt +3 -0
  23. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin +3 -0
  24. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors +3 -0
  25. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt +3 -0
  26. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth +3 -0
  27. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth +3 -0
  28. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth +3 -0
  29. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt +3 -0
  30. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json +3 -0
  31. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin +3 -0
  32. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors +3 -0
  33. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt +3 -0
  34. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth +3 -0
  35. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth +3 -0
  36. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth +3 -0
  37. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt +3 -0
  38. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json +3 -0
  39. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin +3 -0
  40. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors +3 -0
  41. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt +3 -0
  42. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth +3 -0
  43. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth +3 -0
  44. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth +3 -0
  45. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt +3 -0
  46. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json +3 -0
  47. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin +3 -0
  48. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors +3 -0
  49. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt +3 -0
  50. grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth +3 -0
.gitattributes CHANGED
@@ -728,3 +728,66 @@ sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-19704/to
728
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text
729
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-14778/tokenizer.json filter=lfs diff=lfs merge=lfs -text
730
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
728
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text
729
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-14778/tokenizer.json filter=lfs diff=lfs merge=lfs -text
730
  sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-72248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
731
+ sft/20250428_230439_sftqwenomni-simple-loraopt-3e-8bs-0.0002/checkpoint-34482/tokenizer.json filter=lfs diff=lfs merge=lfs -text
732
+ sft/20250423_055703_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json filter=lfs diff=lfs merge=lfs -text
733
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text
734
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-64857/tokenizer.json filter=lfs diff=lfs merge=lfs -text
735
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text
736
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-79824/tokenizer.json filter=lfs diff=lfs merge=lfs -text
737
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text
738
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-44901/tokenizer.json filter=lfs diff=lfs merge=lfs -text
739
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text
740
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text
741
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-41575/tokenizer.json filter=lfs diff=lfs merge=lfs -text
742
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-49890/tokenizer.json filter=lfs diff=lfs merge=lfs -text
743
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-63194/tokenizer.json filter=lfs diff=lfs merge=lfs -text
744
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-58205/tokenizer.json filter=lfs diff=lfs merge=lfs -text
745
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-24945/tokenizer.json filter=lfs diff=lfs merge=lfs -text
746
+ sft/20250428_225638_sftqwenomni-semantic-loraopt-3e-8bs-0.0002/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text
747
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-524/tokenizer.json filter=lfs diff=lfs merge=lfs -text
748
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1572/tokenizer.json filter=lfs diff=lfs merge=lfs -text
749
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1834/tokenizer.json filter=lfs diff=lfs merge=lfs -text
750
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-2096/tokenizer.json filter=lfs diff=lfs merge=lfs -text
751
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text
752
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3668/tokenizer.json filter=lfs diff=lfs merge=lfs -text
753
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3144/tokenizer.json filter=lfs diff=lfs merge=lfs -text
754
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-786/tokenizer.json filter=lfs diff=lfs merge=lfs -text
755
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4454/tokenizer.json filter=lfs diff=lfs merge=lfs -text
756
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-3930/tokenizer.json filter=lfs diff=lfs merge=lfs -text
757
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-4192/tokenizer.json filter=lfs diff=lfs merge=lfs -text
758
+ grpo/grpo-20250415_180333_qwen2a-semantic-lora-e1-bs4-lr1e-05-20250419_100053/checkpoint-1048/tokenizer.json filter=lfs diff=lfs merge=lfs -text
759
+ grpo/grpo-20250411_032518_semantic_mc_qa-none-e1-bs4-lr1e-05-20250420_141256/checkpoint-262/tokenizer.json filter=lfs diff=lfs merge=lfs -text
760
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json filter=lfs diff=lfs merge=lfs -text
761
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json filter=lfs diff=lfs merge=lfs -text
762
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json filter=lfs diff=lfs merge=lfs -text
763
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json filter=lfs diff=lfs merge=lfs -text
764
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json filter=lfs diff=lfs merge=lfs -text
765
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-4248/tokenizer.json filter=lfs diff=lfs merge=lfs -text
766
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5310/tokenizer.json filter=lfs diff=lfs merge=lfs -text
767
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7788/tokenizer.json filter=lfs diff=lfs merge=lfs -text
768
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6018/tokenizer.json filter=lfs diff=lfs merge=lfs -text
769
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1770/tokenizer.json filter=lfs diff=lfs merge=lfs -text
770
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-14160/tokenizer.json filter=lfs diff=lfs merge=lfs -text
771
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13098/tokenizer.json filter=lfs diff=lfs merge=lfs -text
772
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-11682/tokenizer.json filter=lfs diff=lfs merge=lfs -text
773
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2478/tokenizer.json filter=lfs diff=lfs merge=lfs -text
774
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-708/tokenizer.json filter=lfs diff=lfs merge=lfs -text
775
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3186/tokenizer.json filter=lfs diff=lfs merge=lfs -text
776
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-1062/tokenizer.json filter=lfs diff=lfs merge=lfs -text
777
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8850/tokenizer.json filter=lfs diff=lfs merge=lfs -text
778
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7434/tokenizer.json filter=lfs diff=lfs merge=lfs -text
779
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9912/tokenizer.json filter=lfs diff=lfs merge=lfs -text
780
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-13806/tokenizer.json filter=lfs diff=lfs merge=lfs -text
781
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-3540/tokenizer.json filter=lfs diff=lfs merge=lfs -text
782
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/tokenizer.json filter=lfs diff=lfs merge=lfs -text
783
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-6726/tokenizer.json filter=lfs diff=lfs merge=lfs -text
784
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-9558/tokenizer.json filter=lfs diff=lfs merge=lfs -text
785
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10974/tokenizer.json filter=lfs diff=lfs merge=lfs -text
786
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-2832/tokenizer.json filter=lfs diff=lfs merge=lfs -text
787
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10620/tokenizer.json filter=lfs diff=lfs merge=lfs -text
788
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-7080/tokenizer.json filter=lfs diff=lfs merge=lfs -text
789
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8142/tokenizer.json filter=lfs diff=lfs merge=lfs -text
790
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-8496/tokenizer.json filter=lfs diff=lfs merge=lfs -text
791
+ grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-5664/tokenizer.json filter=lfs diff=lfs merge=lfs -text
792
+ grpo/grpo-qwen2a-sft-simple-nolora-none-e1-bs2-lr1e-06-20250515_011358/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
793
+ grpo_audio/qwen2a-sft-simple-lora-lora-e1-bs2-lr1e-06-20250516_010602/checkpoint-11200/tokenizer.json filter=lfs diff=lfs merge=lfs -text
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e882e92811d603b1d7c33169f0b025c4049b2669e537e66bb23bad26ea032be
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:032478a582980ef2c598efe75ad315499f6d42a4e32aa077084cb113a48b8a6e
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4debf9dda4f462fe3511ec26606053718fedd02f09970b78403f90a11722f202
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25086c52a71c82f8f2df859291ac870e7bfd87f70293e98d086e60d4317c1fda
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8400c05d78a868f3fb8829167d16a485f84e33d77e8ca368f247247e86d506d2
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-350/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ed6a42ed7e39af915d76774028325eb34053221e67cef08522b0dbf29e9360b
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:496dab5ac434081715cf9f19a53b79013cc1af9c13392f766b50c29fd432c14b
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e32d69705c106a176d6d90a7526ca0aff0c53dbc698628dc24edbbcf855626f
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae3a5f9f9438f8d33e9a0b1045fb33356838f16c5979de475cb6db60f6920e9a
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04f2401e284b6d6c90d110756cf3afe8dec75b249400c865cf2376b9b319c4c
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-4550/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5ab141ecb9251f7455208a1d7f9c99b1cfc57988cdfb86f11ef65655817a85
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:623d9cc8857f6fe5de0394fb47b498e3cd846748829ea9da03c995c8db951dd8
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c63a212562315fa03da9928d36545a70960c3e9b92ff46463386489fd524b2ee
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c77f1281f31768af4e25df89af97425bb99e7ca1c8e207f78ff7f6ba5957bcf
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-5250/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71da3b020316f488e9841c0d5447d857215527a1303732558eb8b0d5dcf2da4b
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6a0b5bcfa1fd7883b7d3eaa51bc8bf12b62570765d047f46336d204932f169d
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59236a094fbd4155468af539e1d001f6c83152d87694314e1728f9ed82fa161f
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d19a19a1621e733f81299b50ee7e52464ab66cd11517f247062c3dc897bdc62
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24e7ca248b81bb822afa3560fb61ce397c3061d8dfceeb6ebbdbe3c1a81414eb
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-6650/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee67cf4314e0c7ccf5c81174590919078e9753aea37ae2797812a7d1a68c0ae2
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:407f251a8ecbe7fda1229f6223cf007607a4c15dff3ec5c2ad574c3400d86d75
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2353dc8a88e88a7841e663c0c899be9842606f89b006fc5bc99fedad4ce3f8c3
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e9e1cc29e53955ff814da39132fcbf7befe00596ce55773da2c57ddebce732f
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5edfe6d7cca9ca522c7a28c2b9b2eaf9fcc5d05da256709ba38b82a48de2086
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7000/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd61d65cb4b6c5620b6f52209b197c9358ca97736a9b61da04129a46425bd78
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2fba107150e8764af2ede60cf0ecde71465c8088d8af01b08afe9f41a45138
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf32bbba4838d91a90a84eccb3ee5448194306672167b2592f52f0574eca0f49
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1536138e373843f9832da972f066736eff132e58f7d5ad0977019fe93eeb414
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02fdcf932b5458b87023d7a45c060420452d7a97a8b969889ebedd3cbddca1ba
3
+ size 14768
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee90731ea0c0dd8f909335cf442242f60a5949e7f041ece4b7ac574989d9808a
3
+ size 1064
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e56eaebf99a63995f420cf1d71d671180c414ff523f363350b20c982ef29d5b6
3
+ size 12030943
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-05-20250425_022150/checkpoint-7350/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7467d71986e05cec05766ced10155b94f8de393746facf714bb23d4c4e0f4bc4
3
+ size 6392
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75da0e1656a768eb7b28b613273eb13d782d7ca19af3cecd252cf86174381625
3
+ size 22056664
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23ad97008180864f0fbf5aeb018396bab33c7779ef7a0f5ea7d231555bf306ab
3
+ size 33662330
grpo/grpo-20250411_032518_semantic_mc_qa-lora-e1-bs4-lr1e-06-20250425_181059/checkpoint-10266/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:547b0d6f98d44f896382bf36cccc97565692b04e6e52dad6d7894cba3dddae49
3
+ size 14768