Qwen3-SWA-adaptation / .gitattributes
yuyijiong's picture
Add files using upload-large-folder tool
51c291e verified
# Wildcard rules. Every rule in this group assigns the same attribute set to
# the paths it matches:
#   filter=lfs  diff=lfs  merge=lfs   -> use the drivers named `lfs` for
#                                        clean/smudge, diff and merge
#   -text                             -> unset `text`, so no end-of-line
#                                        normalization is applied
# The `lfs` drivers are the ones conventionally registered by Git LFS;
# NOTE(review): confirm Git LFS is installed wherever this repo is checked out.
#
# A pattern without a slash is matched against the file's basename, so these
# rules apply in every directory of the repository.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
# Any file whose name contains `.lfs.` (e.g. `name.lfs.ext`).
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# This pattern contains a slash, so it is matched against the path relative to
# the directory holding this file: everything under `saved_model/`, at any depth.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
# Names with a further suffix after `.tar.` (e.g. `.tar.gz`); plain `.tar`
# files are covered by the next rule.
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Any file whose name contains `tfevents` anywhere (presumably TensorBoard
# event logs; verify against the files actually present).
*tfevents* filter=lfs diff=lfs merge=lfs -text
# Exact-path rules. Each line names one `tokenizer.json` inside a specific
# `<run directory>/checkpoint-<step>/` folder and gives it the attributes
# `filter=lfs diff=lfs merge=lfs -text` (use the `lfs` filter/diff/merge
# drivers, unset `text`).
#
# These patterns contain slashes, so each is matched against the full path
# relative to the directory holding this file and applies to that one file
# only. A `tokenizer.json` in a checkpoint directory not listed here is not
# matched by any rule in this group.
#
# The `=` characters in the directory names (`swa=2k`, `sink=0`, ...) belong
# to the path: the pattern is the first whitespace-delimited field on the
# line, and attribute parsing only starts after it.
#
# NOTE(review): the unordered, one-line-per-file layout suggests these entries
# were appended automatically by an upload tool rather than written by hand;
# confirm before consolidating or reordering them.
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=13_from1_step4/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Thinking-2507-sft-fusang-swa=2k_sink=0/checkpoint-862/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0/checkpoint-8855/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=100/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0_falayer=25_from1_step2/checkpoint-921/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=13_from0_step4_fadec/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0/checkpoint-1736/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=100_falayer=25_from1_step2_fadec/checkpoint-921/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0/checkpoint-1302/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=100/checkpoint-1760/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Instruct-2507-sft-fusang-swa=2k_sink=100_fadec/checkpoint-870/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Instruct-2507-sft-fusang-swa=2k_sink=0_falayer=25_from0_step2_fadec/checkpoint-994/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=10/checkpoint-1760/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0_fadec/checkpoint-1760/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_fadec/checkpoint-2778/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=10/checkpoint-1664/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Thinking-2507-sft-fusang-swa=2k_sink=100/checkpoint-862/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Thinking-2507-sft-fusang/checkpoint-862/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=25_from1_step2/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=100/checkpoint-1059/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Thinking-2507-sft-fusang-swa=2k_sink=100_falayer=25_from0_step2_fadec/checkpoint-862/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang/checkpoint-1760/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Instruct-2507-sft-fusang-swa=2k_sink=100_falayer=25_from0_step2_fadec/checkpoint-870/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=100_falayer=25_from1_step2_fadec/checkpoint-926/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Instruct-2507-sft-fusang-swa=2k_sink=0/checkpoint-870/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0_falayer=13_from1_step4_fadec/checkpoint-921/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=25_from1_step2_fadec/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=25_from0_step2_fadec/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Instruct-2507-sft-fusang-swa=2k_sink=0_falayer=7_from0_step8_fadec/checkpoint-1085/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=4k_sink=0_fadec/checkpoint-1771/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-30B-A3B-Thinking-2507-sft-fusang-swa=2k_sink=0_falayer=25_from0_step2/checkpoint-862/tokenizer.json filter=lfs diff=lfs merge=lfs -text
Qwen3-4B-Thinking-2507-sft-fusang-swa=2k_sink=0/checkpoint-876/tokenizer.json filter=lfs diff=lfs merge=lfs -text