diff --git a/.gitattributes b/.gitattributes index d6a3fae3229a47cd5d9a32e0e856dc42bb35e9ea..c8de753b86c5ff19ed5c21a9c282a259b1cf3a76 100644 --- a/.gitattributes +++ b/.gitattributes @@ -951,3 +951,29 @@ sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkp sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-4989/tokenizer.json filter=lfs diff=lfs merge=lfs -text sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-23282/tokenizer.json filter=lfs diff=lfs merge=lfs -text sft/20250428_122030_sftqwen2a-semantic-fullyscratch-loraopt-5e-8bs-0.0002/checkpoint-21619/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-87178/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/tokenizer.json filter=lfs diff=lfs merge=lfs -text +sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2b6614c1687d8f1794c5ca542816011457f8d7a --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660ef5b561a8996a7b4714653010347c5c80b7fa4f516187d14b6e86ce7824c2 +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d090bee1ecdd8d963d797e09be31b87ccfa778 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd355d7df733a942224be1a56a7b434462cb70da3b1486964a6b478832ff31 +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..0743bc90fc8f7a58439faa95a35f5348c2f5e11d --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf82c94f7efbe943489a6b705dfdc6f64ecbd05f9f6647f40c3c1981b81c83b6 +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f63fa34dc39bdd59c0cd09e63b6362c19997c59d --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44227b061f4948a26b828d1b5f0cb00b3ad435aa83f0c9eb0514020a1d776260 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-1856/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8f6b0f5914cf0a790c327735051ec480d271cadb --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee825acd71357e202dacbd421f8faf47efd30c210c6db0e94d04a858a75e65b2 +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aad914226e2194f3ccebeaf077f1c71e46c4141 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac59d4f64701ae2e9b69506a7c4f94ed05aa7bb2f39722a42abf423c61e17778 +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..390650a7f2248f54ebb8aa77a391aa0db281e727 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca1c02fb06427cc45af59f5b872aab7bbdeea9048a5f93279af167e5d7e3908 +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1bebe45c5c51b9ab97a80233d03b6bfccd75590 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9407c24ff791b760d181c94873b360e1930dd88e14ababffc107a48ee14856 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-3712/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e7e9711559e31d943e535244605de1cabd59b5df --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c23cf3066c06e25299c1b1d8ee2983c03d2fc01b078f1307cf4b92acb83ab95 +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f53c9982b70618badf88e8c3661793059d7466c --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:343262e8c66ed54b3ef1d4d5cbba9ebbf167932bc0990ac4a3edfbf9e3c61c04 +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..faafefb7e5d98bcd0e1f94c15f6078d63102db44 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16647c07cf93fb7f2a66737a419ebf0bbe188b47bffdba8afe8b82c1491e778f +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..950f7edf06802e1cc274b1d3ce51b2233535b6bb --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a82dec750182aed3b47eb6532f4e332681c09277e8b114aa8414430b7ce8116 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-5568/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0546aec9ff7b65d138d0442160d5161c8252db8 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3013ab451a9a15abcc34d0cd2cbe7c9eaab5136a57c8053b94aa3701f6491772 +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..c91a6befb5261440f1238cbb83b5665ae0efe48f --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd1767266864d847db675da4affd7e3d7c31589f1c39ed435ec2a897487222d +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea0eac7111008787d75234798ab7cf477b6dcc6f --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ab1a1b05f28b8dc057aaf48ec573a563c80e3ac4d0c567992a684dcbaf4607 +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..33ed30f58a6b30515a6215c34435cdf58b00f30e --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1b52f2d0d0672e7a488e92988265a1ede8a4844e69c77fc17053899d682895 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-7424/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a31329eeca9e6aa70e288fc386b439e90c1e2b96 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2720257feb4ab20b26cff01523b6b4abc657abb34e9590145295674feff35ccc +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..94fb71632a2e6fae2dc2b3c8df71a3020514e7a7 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f39bc4004941b3a89534de0a213c667a0f7e46b583b59524d8f02f4be04fe89 +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..594a4f815eabb66d8d4aa60b1ada2a281db28ea1 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa6695ad240c6b489663337e6db10d40887d4cb8c4b22a6cde2f29a43a050bf +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..5282dc889625d2ddb7c7404648cfb61c923797ab --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7d3458e9fdcfaa3bebca6bb524367c0027f2eac98c18a87debdfd5a7445887 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9280/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/adapter_model.safetensors b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a93820a33b215d8c97b7095c4e64d094aba04cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78746238dc22092f8fef322d70e668ffb55077b46c4b22e8b935e3f8e6ff9560 +size 22056664 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/optimizer.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..66d6a227cc274ef241f69e47b9983f8e5674ef00 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7b6027164767903af25d2a0a197c5e044d1676157e60b7ddebb45b7f29f818e +size 44254970 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/rng_state.pth b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..82fb19d00145998e863e64d0939ba09e13ae397e --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92face340385cb92a7402cb2a5346e3946c7ff303ba8f7fcd18de6b45d008c66 +size 14244 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/scheduler.pt b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9bb8c8f0a5bc1edebfa2f8941f06d2fc61c0715 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d052ec9e86fd391d22fb127798597d25ea705dbddc399d6f36c1e83059261c20 +size 1064 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/tokenizer.json b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/training_args.bin b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce0028acf1088649d5787f29ca538602621be02 --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/checkpoint-9283/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6fa5711d8aa22f48fb9238292035fa3d9a34fb0b637bcb7b170f9129168d4b +size 5880 diff --git a/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/runs/Mar06_07-54-35_gcn120.local.snellius.surf.nl/events.out.tfevents.1741244077.gcn120.local.snellius.surf.nl.538532.0 b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/runs/Mar06_07-54-35_gcn120.local.snellius.surf.nl/events.out.tfevents.1741244077.gcn120.local.snellius.surf.nl.538532.0 new file mode 100644 index 0000000000000000000000000000000000000000..7c55258f47c6bec4376dbcf0b29d16b62320771d --- /dev/null +++ b/sft/20250306_075435_sfttraining_qwen2.5_simple_0_20000-loraopt-5e-10bs-0.0002/runs/Mar06_07-54-35_gcn120.local.snellius.surf.nl/events.out.tfevents.1741244077.gcn120.local.snellius.surf.nl.538532.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf4e8c3e537ede126002e0ef361ef590f234ba0f5e639d99db5a57ef966b817 +size 151794 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfb3154fb239c0dd374b2e774200e99d335e454d --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce63425300cd2087c2b8bb73c970da593f5e902a78ee37b3d08adc44d45c967 +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbca1c39e345b01a1c9cf4912489aba275dbb78 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd14218867e410b7e3adc42e9951ab4363d433d76c846828514fd496785586d1 +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..19ad9a496f8590dfa397f66ae3001832280786e2 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e310de5c6ab5416e68a174d3a198733f27092cecbb2ada7f84277e2914b7002 +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd8f0f6bce38cdc6a1f28b83a6f558b5cc8ab35 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ff1b37e185dc00b5d4496f77e0376c1ad61e819595c7678b7d23e73a14f429 +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-19746/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f32c7032a7f4e3e9e5cf3692a84d1c0bdad67329 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383396a4b5479bef1ba037f17730dc9170540b2c7ac9eee7336320b1afd37c48 +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eeaac3a246243f32b0f3299770647d1d1d5b286 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adedd6393ecec758c3f9eaa22b66aaee054fdfa9327aa3e0889c432fee60a818 +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1460f1faa30d81c62003bee6caf393ba79f069e --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84555b5913a59f11b6ffc6b91ba976bd1c9529d73f17af2adfc62661baa1dc79 +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8751df83ddf7feeb59fa531e41a9b203c3f3b8 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c51a4425530c878b21176aa94a91eb4ced2973961cc3adfc233885cd3ad39f +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-29619/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42cf181af7dc13cfd7efcda0609e0e59d5b162ea --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72cd39e4826e1ee88ebbe8fc84e3265a476ae5eab632c930913e55d93abb8c9 +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3bed62366e94ba4c065ea96d48e35dd43dbd130 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c893bfb11a1eabb1b698e7b4bddf0ecfaa30b6587bcd9d4099309e2d4d3f12ef +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ff7097ad355c277ea48eff2783db303a001a9f3 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848a68fa3ebbe4e32cdbb94f88abb434dc15cbe7387cb30dee97f587dd0fe95d +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5683a9de431d7eb9bac181fa630a8f56aa5b034 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890addec8460782c97fb7e34d3c78d264ff4da7de094d32e170db7f8cff2b3d4 +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-39492/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3da58947d551fd7c1c0a4218afdf3fc67a3abd07 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849a179262a06f5f4ccf87ef3c9857e21bf0ca50bacd006b32e6b651b2a35b7a +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f224c10904a33ed5c76bf8f552dff3f1820e74 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf90cf9fea27b85f4d1048f8d3dc8c5a3aa150b2ebcea56856fc0158a388b516 +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..5143e0afc7dedf7fb165e4e53f7df5ca670215b7 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21999d0fb87f48b3d35c9a02623e93cde558a714cfaac65ad97f1a0c920a1994 +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e6efa917b37190b8c4a3409a809082e8504c68a --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f3196339bef7a3f9dab1286e98b04680264dede927a90ea06c554e87b46a1a +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-49365/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbf211eab0defd362ff1f4bea7175d0ad87273b3 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11bbb945c4a2cf81e767ce230ee9cd22cd64d3e0d6e6d33eac2b69c277ba61e +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ef661bf46fd06504b94633970a2ccaf1ced3b1 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa7efa36ea0542e97cad5237b0dcd0e6e9e2f0c65589bed4fda5c5b4137d5aa +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..6092a747d6b3df1700d098d9d091450d02d0ffe0 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88958c4f0144242cb9fceb29c32c190fed6336b0754a338fc4b3ae2ebbb9fb6f +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fcd7175dc5b3d0736eff069c4d592dea5369084 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e22ffc7885f17bf94c38b3f96062d60a1dc1be90a8ac7de29def8237a6c33f9e +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-59238/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..26434d6334593a3710ff970a7d83e1075f1fbd11 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8e34c92514216360e017b637bf1819244fa5121e49133994ef0ecc99e02581 +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ea7d83709318f11553ba7628923aab09a722095 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49041f328e2885c09193af520caab69abb0e48d2d081291def70a915baef89cb +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..83231edf7f9bf3afa2cc0165baad7424a5d397a9 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfbe61ee8e1413c0afc45ae71d553fac96305e896897e8e126d4fe1e82a632a +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..136a99835ecc9ebbcf98384c6067086123238c3c --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c455664fbf459ef4f74edb906146c14c38db8698f018690c6fc8ae3495d08abe +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-69111/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/adapter_model.safetensors b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb9fe5f709d10946d39087297dca04356514469f --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c5d7f1cf0c80b64903194dafb2ca823da0bd385c4760dda5d6d9531fbbd657 +size 22056664 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/optimizer.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac6fabc6eef475e1aca271fa77b1df4b7994256b --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b52bd6b3c3287ddd4b4d68d8ac613626daf6fde8210362f2874c0a44bc6cc4b +size 44254970 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/rng_state.pth b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f8391cf1c0fdfb1bf312380b7292e9bae7b0ce4 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef95148e7cb327f6a1468f3927c02b1757b0a43c5de09bee85761970a2ddf2a +size 14244 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/scheduler.pt b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..87924a84006ebe1ae1d0aa5f0e6597903748df76 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb39f0ea8d06f358196ff45ec6eb963dfdedff015c601d163c4864744ecd74f9 +size 1064 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/tokenizer.json b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/training_args.bin b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad13821115d40a2fd1276d143963e350609b1654 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/checkpoint-9873/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f979924fd4d8336365c917d21afaa4a3950602a3ab8c2913ec9b0311467cd8dd +size 5944 diff --git a/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/runs/Apr06_22-00-17_gcn134.local.snellius.surf.nl/events.out.tfevents.1743969620.gcn134.local.snellius.surf.nl.3138922.0 b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/runs/Apr06_22-00-17_gcn134.local.snellius.surf.nl/events.out.tfevents.1743969620.gcn134.local.snellius.surf.nl.3138922.0 new file mode 100644 index 0000000000000000000000000000000000000000..db57c978240d358a5726e1a9c565aadfbe30dd15 --- /dev/null +++ b/sft/20250406_220017_sfttraining_qwen2.5_simple_qa-loraopt-3e-8bs-0.0002/runs/Apr06_22-00-17_gcn134.local.snellius.surf.nl/events.out.tfevents.1743969620.gcn134.local.snellius.surf.nl.3138922.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2edc5b790eb1044bcc6e873f8bfabd1a85abd44edf43482c970feb59f27f98e +size 2202565 diff --git a/sft/20250418_131903_sftqwen2a-full-semantic-loraopt-20e-16bs-0.0002/runs/Apr18_13-19-03_lrdn2916.leonardo.local/events.out.tfevents.1744975150.lrdn2916.leonardo.local.1167629.0 b/sft/20250418_131903_sftqwen2a-full-semantic-loraopt-20e-16bs-0.0002/runs/Apr18_13-19-03_lrdn2916.leonardo.local/events.out.tfevents.1744975150.lrdn2916.leonardo.local.1167629.0 new file mode 100644 index 0000000000000000000000000000000000000000..38f4a7159297fbcc0bdef62b15dbbda8de59f907 --- /dev/null +++ b/sft/20250418_131903_sftqwen2a-full-semantic-loraopt-20e-16bs-0.0002/runs/Apr18_13-19-03_lrdn2916.leonardo.local/events.out.tfevents.1744975150.lrdn2916.leonardo.local.1167629.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1589cca2255ebd66b384b056d54615cf27327904c59a5068a3491c272449d8 +size 6575 diff --git a/sft/20250421_230841_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/runs/Apr21_23-08-41_lrdn2430.leonardo.local/events.out.tfevents.1745269729.lrdn2430.leonardo.local.4083058.0 b/sft/20250421_230841_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/runs/Apr21_23-08-41_lrdn2430.leonardo.local/events.out.tfevents.1745269729.lrdn2430.leonardo.local.4083058.0 new file mode 100644 index 0000000000000000000000000000000000000000..f12d40a17f2bb8a4841af463f0d6a435211850d8 --- /dev/null +++ b/sft/20250421_230841_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/runs/Apr21_23-08-41_lrdn2430.leonardo.local/events.out.tfevents.1745269729.lrdn2430.leonardo.local.4083058.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abdeae7f667c469262a5c6ef742b83dac4ed551484c02dc93bcd98116baa9d4 +size 7665 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37034e03819d082f95303dec3c71bda032d52952 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c5701ede11021d900a7b8166d9c16aa6b7a8a8681523e50569a7f64cd969c8 +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a484d735235567385be1d5332c4450b8007d3f8 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2462c3243cf074da3479ba0c61e08b22803cc9dd3e083b6aeb95451d7aa91a9c +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37319b4b6c46e9c97bedb9d30d975764e25850d5 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38f2b8b952da4dd67e6fabd73c3a1e194632776a237c9567270d02606b8503f +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0ce8c399970ede9281b1c5587cbb552eec78fc --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892e59c87d33c8e3392a0fa2125487d771c94a2993740c471e58cc4ec62604b3 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66f71683d39f93b275ae572e792b1e1d5057727 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:447be066597171951850f80b362e59c263bbc3816875f74217ddf0c47501262f +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb8f9d0877ee650d9c9d5d9aa10fafa8877a38d1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9de33cd1e27f25945d332e8a4a8bda944bb4836afbfbbafbdc16df389e687c6 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a610f74042aea89d3498bfa441361433d7974a --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b9fde97f1382d9cca8df844b9b0935a213483d6b8419c66e7ae168e32424493 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df2965274a1f1614611010b08eed35ecccf3743 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998d34f0e833ed897d2c1049e2f99cd1282e5eb3136e9a5bce172a4bca8e45d9 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1878e4f7d21510ac58518e91ee102fc13f8e62f4 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/global_step11641/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:168211a16dfd053fd8570ed4c8a5ad66d89c52bca530379859c3fe6982321613 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..21d1028280d7bcf71477542d16f697836e420df3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae04e827f697e7bbd4fcbf47b9f25516c1a83774d8d41f3b3fae7796c47799ec +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..c88f403dae9d522d4b908236e2102c3cb3daf8c1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b7d483f46190d54dd15e89118c9aee8bfcbc67e7ed247600ccea53255e28cd +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..c49823444d075d192aa4b2767e8862b5f4a5842c --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f694f47bbaf511cda1bbc03bf9a92d840dae8ce66f6f268b26a21b4cd479200 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..b45c2cd4294eba61e60808087b8dc017924536e1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8d68f9233080da66d2d08937da148ef595761179c94ba852ebbd95b8cf266c +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..39bcda6877bb82a0dbb8f145fef8d79432c637d5 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9cd66fed3fa18b7ea2a0a41c315557eb023a7dd2043fff39562a79ef66e7f4 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-11641/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b618f2540b81a9cb98fd4095ce930522dbdb892e --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd0fc1242c5101594afc9bfbaeae8ec51eedd2847fc5d9fbf58100dbc55f2aa +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..184448a22d0943cfa4f986e9c2099b01871cebf7 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85b94052b30aa6472ff277ac4bf1eab890a74baf21b4f12f9904e5b05cc089a +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..239905b4ab5705da5e215ee3310f209d0854bafa --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1dcc14a37a400b2da6e0e0da7dbe10e28980d44777bc01b738c93dff0edff56 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2311dfc4248dbd023e2e954cd74fc528f677d1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e06afd62ef5e58d387a89604a0d5445f4f1516703cc4c6f317ad0d5831a2899d +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed35d74a8301b099da272c9afc1b4fe56484594 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f894e48d2a566602d257dde6b6cf87c39030e12f17f8e06f6c4faf18e0781cd +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a58bb8165d5937c852219a2bf9628b9e90f198a3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9321aea3ae2c982950b9ecead2271ab1998815065aaa1094925a50fa94a52e8d +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aca3e41d2c07477ee120f1496198f19129ac926 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb46a963882e047113b4a8f2edeec608cb9479953aa6db1896008c5ecd3b3cba +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7b6b19c6a35874d1941ff644b4a701b69e37896 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983fc7180b6e1e5b4629d13754b75c264465c6faf8238a15c2df3fec96a8a1b3 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d73dd9f6adb5536ade12b42c159a79036e9f64f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/global_step14967/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab55488061d50369ad86ced9032c8850089ffdb39392f5104d8f4619a67584b +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..e95ac6f1b133cd47f0a30529d71c9c5a73fd3fb5 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9b1dc3a4d5c2b1f14b298da24523ea040796cadc56b16c8b7dd9f73b0a2989 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e8de35dd8fd0ff1c05c0540633dbe98652792ee --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e58607e6fea5937a069b88c4ff761919a9b7a82b3885b9108ec15566450bbed +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdd0a815c6090ff83f7f1823e86d61aa9366082b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2656d5f7ec9512ef5acdfa9600593652e90732f4564c3d82ac031907179ea4bb +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..5cfab3743fae0b5b15faee381026b5b68c35140a --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3acddb4328dec5589c108f2aed472a21d07489217a26d757430c4f60c10f72bf +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b41098db18d49e430d5f7e57e526c924eac543f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69120ac56121b144562f57a7407e5c67d7be08781bf6bbe660fd2d6e46ff0c6 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-14967/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5dd557f0a9602a605f45880e839f120eee1e71e --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7843d449c9a204184e65a195caa857c4663f43d1ec16095084968555d7ed823 +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48358dd9935db40f1ca182c5480d5a45dddb2ca8 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a5a1a94bf56127c838547e2fed33a2801ef5a86b09cd337e981d330525d4ef +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..770e618e3031f3017556c383cd5aff8b5dd52ddd --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ca3e3b5bb7faa3af8c5e582f5c33d1217975b023b298039b19eb1cad5166d8 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a0e61355919468f1f8c625dc3da72346400b4b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c8650a7a4566637a6cdf37c9afbae2de75a2ca99f0d561d9b8c5d475691deb +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf4c84c6889980a7b7726700f91a118f29e50f6f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6784eee3ce00b5487b7644dde0f5f2b73125050d9c45c175f87b4d383c65f19c +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db0c23017c8a8806be2edce3fbaf43ade344f2a0 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f58409d05edebedb5ad0289403242c93953ec492d8d53623506bb4d098e9e52 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a9b8d1f069a4c6f67cb7197a1f539d3c0a043ba --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55696945c8d4834c44d05bb55980883be9b0061228a76d9de2e1856a488dbcca +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9f3d7e4cb3ff187303f1ab9ae69bc164e78ca1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a29cd551b2f392a8f6de11c3f8d64c77a80fd8bcbc2214bc1ed4533ace4209e +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c57b5638256eeb35513cd6d92b451bfa083cd85b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/global_step1663/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:109438f65212576d722e92d9282bca33acb84973ef67c1ce52579bfef2a0d490 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f06f017aee3a42a8ef9eda0a647f1b5d6da12f7 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9acb08a30b1c2a44c8ec9654ae02bd8997ba3f81b020ec01f30b39bdd65354f6 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..418c4b6f983b8da496fd58c8a109b1d2e0273268 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f3e014aac6d1ccfc9317ae6465c7017847275d8219a3e7875aaf8934fb2df1 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..65325577735b0542590bcd4a4ae2fd50befcd9df --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd3564beaad2f519d75c1fac2fa4a6f0b45eea8417517c303dd536a035e938a +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ab8b32f8cf0f82cb07c8009233bcb5fa9d84b83 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24763e323990ee1f3aebcec78519c6584f3df6644ba9042c3f671d7e9632eb07 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..babe861349d437f287492e9f3eb3d1c97c306920 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a5c6795140814b08705d3a2c82fd9302c3099ff12c444a936995bc0fef8090 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-1663/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce5e647c6b1ea27d941821fa9b07d55dc16c4293 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ccbe611bdf2cdc94e4db7fbd5f0fe69e754b4378fbfe757070b24af6c543b8f +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2416d017e59ef3eb4947ddd5410577f624252eb7 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd274a3211ed92f678a781bbb82586316b7d1d4902ae94b7dcf474e425dca74e +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f10182995164b79f8efabb005f996ff27fc19bd --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a2264d27b0e4e7807589d80d4e91544babb6979dc75376121a4769bbb8f9f7 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a334e0dd1bc6db1131892813f938cbfaadd8f67 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217b7ed6d4b22da0c16f7ba8c89e50d3b61c9d34c76cad20e7ef46b540cf9634 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b747e4a3b5269d54bb0f5feaa73c87d963aa22da --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85daacb9c9e04fe26a670f69cc84c13ddce7b43bfae9272abdac76553c484115 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ec95bd950fe12d8f93a6a96b0c68d5d39e7f5c --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4749fa70d01942321d0c12747be420898a5b8f684fb6d1b08ffdb5a67e0c89c1 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5554d590d2cd3c88b27fb9ce62fa68f1587db32d --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43c5ac7b8c1352f249bb2a2c22fd130737f66733ae9394aac741869da150577d +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8587f241d5483ec45d3d49bc625fcdef383f1b20 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b875be355688e58ad3e1bb314cd898b4b4f7e0983aaf12fe43c45be0321e90 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c62575c7097edf5b7d3bb68ccb1aa8209df908e --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/global_step16630/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23054b9e9b07d54b8d6211c7bab3810452d798f8c1a25a84601320ceb395b724 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..22c48fba5b48e703096a9879f0c5d0b7781c8ec3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3163fb2b05b680ad6f05edbcee4ab6daac774213dc0cfb24a4e597d1e143723 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0a038e029ad63d55c5df6a308ec5e475a036cec --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1734ff16e68dfb9b4c63c42c847ad6f96830ad23e646820306a7ddd6556de1 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee712f9a96dec323bbb01109ea0a38b9db03183f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df24861ab88bfd00d8c26fef3cedb2cd91e17e2e7dec200a333693879a9a74ac +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c3158d924b7d23e864eb38adf84e2957a654f5b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0a6d184c26bf913ec9d4faa243161f5a2afde2a85ba693172b0829d0089de6 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f3e7b53ab47d0797b1c2a095ea8d02d0022ec2 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22ea060a504f9c20f8583fc08c9bf3301927b2c52eb055ff81d95c8452d0c4b +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-16630/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76985b6e2047b351b0975f34343218a11595ed9b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc65496e1ae520274ad1b2fdb6385fb33f532ee2167a04f5aca91a805a43f61 +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a58b13ec9aeeb926c23df1e2841690aaf319a2 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1d76bd59cf8d38d4f51a0d3a98c0ceb5f1ff20d35e772651bcb6d0270d3b686 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d962ac8039afc4d7f48a25449c62e296c7d120f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48dc92d15f3254953deb198d7ad5871a5996b57406014add16fd8fc2395f1bef +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b403fab920366f4b585fcfb1eb440dc2cb7f27 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0c4748864dd7d0e40c5c4bd2f3e7add569d3cb843d91cab9aa30c34c38c5c5 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8b2bced75ac5428cce4583f0c0074d76a3e4fab --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:170f98154c5a0808033627ff03d9f65807416489672cda0fd57ee5074788f7b6 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a06749a2d613930a431b02c912c4ae48d1fb5d --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43327d95081c1e6b07e63734df1fb6be87dd48410ce707532e2d262a37e514b7 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c36fdcfb16efa8e4e60378522a9ac26c0135e284 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e301be654ad91e5ab4c29fa64e95344ae54f14f2ffc1af8d797ae978232f8a +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..236042031bc1830e314204a12b88f2b97ac89014 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f3b84c299d62e5b381cce3b1190f5abf338a54927c82a5b000e30496e95c16 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..655c2619d79771e8b9a0fbf0416646e71f377ae9 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/global_step19956/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33aadb081e8fdaf6808fcbbd06b50b5699c4e7bbf1ec9815926158ad9eb7e0af +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..f25fcce1e7bbe45a7c3e8449384a3a5a5ed159eb --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c9fe8fb60a45afb981dc96a072b6aa4c61d013f0b958667167663d2e6f2c86 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b3fde86cde7b0acf58befb1a59ba980a16b482e --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e24a874ebebe3a8129fde8122a5a5b6bd7810cbfe762b0d160b92c63919312 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f67a625fcaa2cd453e955c546a1e2dd05e9fc995 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c6494bbcbdeeb7e286b0d7f211446e5b83f17bbe3a479ffee8c0192ab34dcb +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..89153983f4fe1036b61ec52474e1df140793c0c0 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545492d43521a25583c6fa41afbce7a3f9abd2bd193cc794740de81352a7dd95 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..104d9703cddff750f43511f044e7d465af89820c --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5975ae1ccf0afbfd1a9de1413a8c02c5220aafbff00948b8dd4d005856e30941 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-19956/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d58dbf76f945c33558de43eeebf4f6e60a907a3b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583e3be8293c548a26564aabe4c5c8fea7b881a81e0af16a3ba8b2f0cb1988a1 +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27dd6ae560ee94b82ff3fd154f22d8025fecc96b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e09a38e0ba613d264fdc13b865c1c089bcdbac8619a6ea025ad4cefffbd5d6c +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97adcc5c69e4ac3258c7660bbfed692fa1dc5d4 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b4f8e2fd6555c58dd3debfc9072f2a999d772c5d376fe352141f6e7164cd78 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c13afaa3a3f0d90ac8fd8398206fe1c4c35668f0 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a92b40366b69cd9ad7e29f15d8eb7f3f7e6251a37f9ba37421c657d1008d6ea +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01d73c8bc0dfc4420b3ae64deb8511edd685604b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f6aa4113311d1ac66603c71d99def46b9d798680926a12f7e39134724be626 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4d79d3dbc987339e9ecdad34390078e1262a6b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0299678ac2d88cf0ee1c1f844475d487382238b5827feef1da29df7cbd73cc +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97e774b82bf14f524f364dec612c02a1450a2d3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b4e72ea52defd24ce972d4cfc0d2ea61d7b94a0fe9310768de6107b5a5f997 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6812ca9007db8d2955b3b2bdeefc9f24b784b3b4 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a0bf7bca9a9d102aba5ab32d1240fea31774c4e5c76d2d4ecc3db88942f201 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c7add67c5f1fd69e5797530015268794197b918 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/global_step24945/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f0bc101cd86d101c1bc39d711846e56ec3d9a75fd6018cd9db95dc1d0cb8222 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e1e43a06a1d0b7845186aab01301453886b35cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7a5725a1872be8ad72e1fe09ef753bea552afb85d928e564e328a2758de256 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d785ae145863f6c28e422b7f40a08eebfad37e5 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855cea7ee90a89122b39a4a96c5fac40908944b55ac96eee62a0f35ceaadc99b +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..32bd1beac2a69b0ff599e7c78a70b9e50802a74a --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff7e090dfeb270f7c0310346fa94a7be82ed2e3d58c328b9262e0c9ad6045e2 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..326c02d37cb4234bc8164c1264b43fb9fc0f1498 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc795daf91dfdd3e46d9cf8eb9ffaad6242ce70271d8784d5e67b3785de977fb +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ba7ab995ca7ee9e46fa349fa3145f6acbbdfb82 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f754335ccf13a14a96ac1608619e626513315000040c97cd8be404c9168588 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-24945/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3bb5eefb224009b4f140b697a3a284a96630535 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049a044955e48a0a23befa0ec678fc72eefa73f719d4a07e86d0855886faf8af +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5eba1b6e9e6c208b812d216ae03a71fa582aa3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c14745838b1e98ec7c978146fe7bc4f22f8ecbf09b9957861f711b88fa8889c +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a102b08da5c946cefaa6d4f9716e6845cd1718a --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee6911a1ac4b9fa06a8fb390f552dae1dd42b0db09ef990b00289c4e314976a +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0ac89f7acfc0c5e0c1aba62d7f1b542d26ed54 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842cc49128e02dcc1f5e94236d4431a8fb0dd50cc3a341eb938f6eab7cdf10e8 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2356393447591f52b6644f335feaf5bf8d835d0a --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eee157c6097b87af0af82937be740832d9cff7cb3d0ba03614203acfef94603 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d91e45827c51f62fa86d50ab6de6df2aa7f5ec6c --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0377273baecd4a6c38748fa62b6dc582fe7e54d876fb279f1a3d9d60f4a61de9 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c2f59d64c84ffecdbaa018c5c9fde4c0d2e284 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cf3fbaa339528c1944fedc11c35640b94bbc8647fa694483d981893ae29fdd +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf94ba37a8acc54cd974e9a76f3be2af2d87e720 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2874cc25f6f5612d05b952d0f22d12a0d432d3fb896a5aee4854f0c25f82ca8d +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2b4caa4dcfa8ee4c2a31ace7fe8a2d77f245b06 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/global_step3326/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e58d725f8be5ec9fd6e88916695052acbeb867c86280854f220abf4b8790487 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..3eaff6d3965eb22baa64914c5221e42d62125bfb --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a11ad45b514b786e43d0241a1f4b61e33ae3c06cb3fefe813c085ebdab76d5c +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..0af919947d31a0539e1092345f0907530320f385 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d162cc39a622c1fcf117f45185dece7a8858bac1b567b5cf0292c39b9bc20858 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..6ac3f39d231d3a7a764d11b7ffe4a9f828740908 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deef44e2f5c781860630b704aa3363a708b584b07943d6b440c32c83431521dd +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..67e12e72a03b750f71ceb5ebeee153659985c1bd --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5162e9b0bff9daced5fe7e85e049aafa67fd489fb8e3941eaa3edb88f4581a8f +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c052e55bd4894acd8e822ede5ec0e07bf109e8c1 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fc370178b68b938a0e5e19e2254d6f15bd205b65e9f04130e916b72c783f227 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-3326/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d7fe1e8fc9991f730168b1183c7ee8a5c78cfa3 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dd4bacfb731d46b9cf87588f93bf9a6538ea06a2f7a2ed5182c97e7854fe3a +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ccaff150dc195277416c95d0861b3e15e841e5 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b74ed1313e164b1380845fa61a6e25cca24ef7357be2f7e7a52fe2e2ef2151a +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad81564899c114e5635ad9224d527ddab8f8215 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab1dab15c9ba68af7b7c51ed54917c5e02d103135671430d55c99198915a004 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc85eb49c47e5cdff8a2251ea712d02962ed25b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4848011873aec329795f5280f70374e1076da7af477892b04f42c7a29d4b79b +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9fa37e1b582258eec0c25dca3987a11018dc98 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/global_step4989/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f82af72f83fa96cefb9b00840bc13fc558959dfa9669f5edc1dd2c6c5cc38f3a +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac7ca9421dee00575c7bfbb7696729284c4a92f6 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1dc8be5e19479032ef56cc83a4c900fcdaec17598ce60cf5698bfb4ca044caa +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc516952a96f4b5e683d253d2486d0d5a7fbd690 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf14f0f5c8ee6a7ade2d76f32de9c13e8af83fe431bb9ea3d5f5ba28e92213c +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2df3191fedb30188dffd6d42afeffd9028006832 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c0c44356b0f308c6bfbd904a721ddf35381ac01967180db4c18620746aa87a +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..df028dc7e7e09d556316d6a086b379258b314c1e --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3150ce5067fce9fc0eadc09064b8a539a14c30744e578ce11d35578812233d +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a0e456a84052ecc31461bd261d1fd7e7f2e652d --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bf834d36431f4f5d14c42954f6c23d9fca663de4a738fc699b9be9b6f4da0f +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-4989/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/adapter_model.safetensors b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c91a25d9c205076fbb4dc3997a1f4e722783d02c --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454e449ce0fe75af27b5177a14abd2d0d787f5d7c5b57a1e3a103158c3703c79 +size 11046672 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cebf2d0c03bdfe116d6bac8bbebff3edbf439ec7 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e7478943e7ae1902ba29322e180f765bf8a3cc7a7a8441f0b1cb125a3036c2 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83bcdcb2e07816827880c0a331100ab7ea29a16 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429c460dd422b2862b15a06e9cc7acc9df13327419f94662c4dc1f7bcebcdef6 +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..718c2c535ff7e9108ad44a587bc61e94e0744b65 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728a392ffdea0b60c441c8666d6404ad251ed065589fe629be7ff2a7b6b0ec9b +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73849d54933a965b123c5c3ef0167024207169b8 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:155f399e4ec1e78efd42d0035b6221e8160a247a55b5f27bcc6f78c24f77359b +size 16518576 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed680b9c2a6d072422a2cff9bba4154e434ffc08 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3501f5b771b19ed9b6336ee9f1ab8a1ce58ed6baf4cf8a19ba5b59119be72116 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdcd58b457f3451f3023532be8e25d970734bb39 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f7cb2ca29cf014267a9c28dc68849851c0eae0cc97c1a9b1ef251f700124cc +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..181712ebe570a2f6a214c7958fd3266e57ed693b --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6aad2267846f2c8096d5ea86161081d8e4842a3950511a0a777a52cbb153e20 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925b118d0b3efa077a5227f0557a57b52f52a888 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/global_step8315/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71476d90da388c5d131e33d8062c8595499fb8fe26cb715bfec0fae7af2f39b6 +size 321070 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_0.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..518fc42e5eef5ea2b4f31bc11317929a71496e64 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632c2104ba79bb84c259703b79ee4ab51268213ea85cda0088fac5cf3d224fed +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_1.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..68569b8970164cf4278026739eb01af10dd3996f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edb44333d8782542f62425e646fe5478129008a1ec196f3dfaf8dc15c2ed429 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_2.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..5755410a95079ef6fc8cdcd0850c40235b30bc19 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7daef1fd11930354d3efe146139fb5bc04ba6dae1a7920b50469ec4089e4ea58 +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_3.pth b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..dda8fd28be18f851b3fbdecafdd2a10868eae666 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb113ad7131eb034dc44867e365606cc5a1b0e4e8ab3ef246e7008a03acd806d +size 15024 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/scheduler.pt b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f72d9cf9cf9c1125824ff7afa34459b7036dca1f --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2760ea7dede85270c4f3e259685b6c79721dcc241421f2313b897bb9ba37f707 +size 1064 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/tokenizer.json b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/training_args.bin b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..b75d50cb82fdeb0932f76ab247c5669f48431305 --- /dev/null +++ b/sft/20250422_192334_sftqwen2a-resume-semantic-loraopt-10e-8bs-1e-05/checkpoint-8315/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca2f40e22b8f7ffed97f5f8bd77bfc8853d3f2f79f06c66119bd43899dfc5a +size 7160 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca1f68f36c3dd45bccfbbd7b03a51d3b34b7a3ed --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d143466248a8974256ccde7ad285f092243b28432923fffb15acf52a53218d +size 1401735 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b2cc3f35595f0e6460ce1e6cc28e6ffcb77b0cc --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de265b4eefb945687c203fa66c2bd00c689ef9b38f938b1b9ba769197fae430 +size 1401735 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9fb1153540e8a98fcae8ec65d5c0e0facff07e2 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71d3257e92e8f02abbdc4a056eacf10d914a62457105b097ae85599e4092db0 +size 1401735 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68eb7306550adfaae24dfc2cfcaaca0d95f95068 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/global_step36597/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6216480853283e6591e6cc4bca0441cdd444722285423c01b587e8a4174e6027 +size 1401735 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db40638cfd4d04b738c67769bc1eaf09b9d534e4 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8425531c907221dcdf4804b39db8d0ce28c2d65b20c8e31ee2b4e5e635be28eb +size 4991459544 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db8806b3fbdbb9524cf498e04c02f1dab3295975 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249a1518e892949d64706bb1efdef6caf09d123b4aa6f5ed7a6272bbe9cf7bbe +size 4991757456 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e0815f53f8242d2c880a1e48f013123d615e042 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4332456c8959e1563610ead40dbbc5f20c6032d72bc10b88ddf71900da1b4fa3 +size 4947691960 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d00c214a05247655908f54d73d6ab2b1d9fdfef --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d95126bd085dda0d5c9901b47379ed4b1f8dc492c1d403d4ba3aba7a710872a +size 1863387424 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fc5a160cec57abb9b13c2a062c52fbe6a71e188 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659dc9beee437011295c32f0e369eeda66033d741de1417e5c2e725bc06993ec +size 15024 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c2c26948d72055c17d3b892b72d3b4d0c8aed3e --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c925f0a9be9f41bcc3e25304f638715b43d9d71ba9a923a2967fa95493f71ff5 +size 15024 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7bb27fc4f898b36bcb677974e2a3799953db489 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58973d261fdababb9058ec19e76a722c8f97e0726b50faa642ebbc0816eb205 +size 15024 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..763df6b57988b69897fa61ab7e082af10f237de9 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeed214d7c5bb3081fa4e35555f8aa33881b07fdd998350a014e5ea094188e22 +size 15024 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bbfa49057b862450cc54bc19ffbae41536bb7d1 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0763ca19f582c73f8ac88de5446dc1d84f3eed0e65f3995cdc9c4515ad0e123c +size 1064 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..91c743bb8bd63f5dad1db5e08b025d73c0b7b3cf --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fecdb47d281073055efd605d080013e3114ed0f3c5d8af201e245b199864c9c7 +size 12030779 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad4c15503bf2f6b365e8b7158014052fe88a6e71 --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/checkpoint-36597/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55e10e546d2f9501314b5e3d4422a32d16b177a42741f92de1e2ce95c3312fa +size 7160 diff --git a/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr22_19-35-50_lrdn2812.leonardo.local/events.out.tfevents.1745343372.lrdn2812.leonardo.local.2689265.0 b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr22_19-35-50_lrdn2812.leonardo.local/events.out.tfevents.1745343372.lrdn2812.leonardo.local.2689265.0 new file mode 100644 index 0000000000000000000000000000000000000000..fcadc173bfdb2dbb8a8317ba87bea988a71cbe7a --- /dev/null +++ b/sft/20250422_193550_sftqwen2a-sem-nolora-noneopt-5e-4bs-0.0002/runs/Apr22_19-35-50_lrdn2812.leonardo.local/events.out.tfevents.1745343372.lrdn2812.leonardo.local.2689265.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4356931893036bc41ab7e2309a0a9605801ac1092abeb3bf8184a6d7bf2bb4 +size 211728 diff --git a/sft/20250429_131213_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/runs/Apr29_13-12-13_gcn145.local.snellius.surf.nl/events.out.tfevents.1745925179.gcn145.local.snellius.surf.nl.2929798.0 b/sft/20250429_131213_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/runs/Apr29_13-12-13_gcn145.local.snellius.surf.nl/events.out.tfevents.1745925179.gcn145.local.snellius.surf.nl.2929798.0 new file mode 100644 index 0000000000000000000000000000000000000000..3bfa53b3231abe4027db1e13a32544ff68bfd7ce --- /dev/null +++ b/sft/20250429_131213_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/runs/Apr29_13-12-13_gcn145.local.snellius.surf.nl/events.out.tfevents.1745925179.gcn145.local.snellius.surf.nl.2929798.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08205f1f5be726fec2225217ec8acaac5d45d78de3e7cacc787807bf02c7a577 +size 7811 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/adapter_model.safetensors b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..809cdf6cd2b860895d03ee4acfdc0a2b85be12c0 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc576d19417a76010990bf6d8ff76d39b2579180cb095a1de67f77cf0850b8e +size 15367872 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/optimizer.pt b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..a780646f57f912525db57d54f65b6104f290f905 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511fd504588e4b277f331a88d0951ce48eeaee9329b1df9bccf9dc1fa70005bd +size 30872250 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/rng_state.pth b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..1db9226e80ad49616d17c360a3a27b36e8996419 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf2acce645026b91c09100ffd226a070806d2cd6f356551adf45199c33a891a +size 14244 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/scheduler.pt b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b50734a5112927af23ee2176dfa6da43216a42 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a897365987c0d78e582f7ee8d7aa6d92d3358a6ba3c0dcd90d87ff3fa0c216 +size 1064 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-24908/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-87178/tokenizer.json b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-87178/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-87178/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/adapter_model.safetensors b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab1aee4c279f4e6785e0038448f8e148d4776312 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220b4fde5f4d656125142adb4d54eeb296b5391326a1316c0af538716fafeaae +size 15367872 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/optimizer.pt b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f7feb7553224e6bfe3e2f4c82f5a8df5cfceebc --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727c5c6607e54d29af28ef78ae2db5a9ad46574bb1d40b14bc96d628d9e29acd +size 30872250 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/rng_state.pth b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..060a326fc997bba1e8e03f373abdcb3424fde7bb --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2ece16b5b62c2235870e33b6386469a1f3e876ac6580e4d184aa60237ab739 +size 14244 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/scheduler.pt b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..3766b7b5b155516a7dfcc7d25fd5e850ca6ba54b --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966f563a4e4e1ba4e8fb5294cd1403b2f47f5cb017d5b7bfa5878c6c4895d088 +size 1064 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/tokenizer.json b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0a8d651380b80b1775af303bdabc6da4e6774ce3 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8441917e39ae0244e06d704b95b3124795cec478e297f9afac39ba670d7e9d99 +size 11421870 diff --git a/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/training_args.bin b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..db462e9f036a56dbd78271b5f3c3f5ba0da75011 --- /dev/null +++ b/sft/20250429_133137_sftqwenomni-fullsemantic-loraopt-1e-8bs-0.0002/checkpoint-93405/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde9e9296d6ea0e4df0bb27e9fcbba4ef64dac6fcb0b9f8ad15aafecbd907467 +size 5944 diff --git a/sft/20250516_000144_sftqwen2a-full-semantic-noneopt-5e-4bs-0.0002/runs/May16_00-01-44_gcn153.local.snellius.surf.nl/events.out.tfevents.1747346549.gcn153.local.snellius.surf.nl.3440925.0 b/sft/20250516_000144_sftqwen2a-full-semantic-noneopt-5e-4bs-0.0002/runs/May16_00-01-44_gcn153.local.snellius.surf.nl/events.out.tfevents.1747346549.gcn153.local.snellius.surf.nl.3440925.0 new file mode 100644 index 0000000000000000000000000000000000000000..d561377ffa7c8a784c5cfc40413708d6616cc74c --- /dev/null +++ b/sft/20250516_000144_sftqwen2a-full-semantic-noneopt-5e-4bs-0.0002/runs/May16_00-01-44_gcn153.local.snellius.surf.nl/events.out.tfevents.1747346549.gcn153.local.snellius.surf.nl.3440925.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538547277c95097808c9d70399dbdf5bd3af48b3d0987fa09799cb379577b07a +size 6526 diff --git a/sft/20250516_012535_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/runs/May16_01-25-35_gcn113.local.snellius.surf.nl/events.out.tfevents.1747351585.gcn113.local.snellius.surf.nl.1064258.0 b/sft/20250516_012535_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/runs/May16_01-25-35_gcn113.local.snellius.surf.nl/events.out.tfevents.1747351585.gcn113.local.snellius.surf.nl.1064258.0 new file mode 100644 index 0000000000000000000000000000000000000000..194fb314d5291f385d2e76e84e9dceae5f24a6f6 --- /dev/null +++ b/sft/20250516_012535_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/runs/May16_01-25-35_gcn113.local.snellius.surf.nl/events.out.tfevents.1747351585.gcn113.local.snellius.surf.nl.1064258.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4832f4e89b4f091e44322b3f9a2f7ce35061c94c82222658897f726d4733f8 +size 16679 diff --git a/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_0_mp_rank_00_optim_states.pt b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22915a0620205905b5dd49f2b1a8dce0ae3452a7 --- /dev/null +++ b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec3bed445ce16d35b4cee4d38cb764e9648a4ca0e85beeed49935b5b01544da0 +size 33580712886 diff --git a/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_1_mp_rank_00_optim_states.pt b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3337abc6c266a4e2fcbafb24e8063a49262e986d --- /dev/null +++ b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb6932deb8f0c1a7968d8c3e421c459df9a18f752c01af379dd723e17974a6b +size 33580712886 diff --git a/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_2_mp_rank_00_optim_states.pt b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fffa8dc9b28d40962019e77456e5f11189ab2b2b --- /dev/null +++ b/sft/20250516_024349_sftqwen2a-full-semantic-noneopt-5e-3bs-0.0002/checkpoint-29216/global_step29216/zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a091e3eb5f09c4675c77de6497ae7dc7c869ce92110afe7d6cc540eddc1336 +size 33580712886