| *.7z filter=lfs diff=lfs merge=lfs -text | |
| *.arrow filter=lfs diff=lfs merge=lfs -text | |
| *.bin filter=lfs diff=lfs merge=lfs -text | |
| *.bz2 filter=lfs diff=lfs merge=lfs -text | |
| *.ckpt filter=lfs diff=lfs merge=lfs -text | |
| *.ftz filter=lfs diff=lfs merge=lfs -text | |
| *.gz filter=lfs diff=lfs merge=lfs -text | |
| *.h5 filter=lfs diff=lfs merge=lfs -text | |
| *.joblib filter=lfs diff=lfs merge=lfs -text | |
| *.lfs.* filter=lfs diff=lfs merge=lfs -text | |
| *.mlmodel filter=lfs diff=lfs merge=lfs -text | |
| *.model filter=lfs diff=lfs merge=lfs -text | |
| *.msgpack filter=lfs diff=lfs merge=lfs -text | |
| *.npy filter=lfs diff=lfs merge=lfs -text | |
| *.npz filter=lfs diff=lfs merge=lfs -text | |
| *.onnx filter=lfs diff=lfs merge=lfs -text | |
| *.ot filter=lfs diff=lfs merge=lfs -text | |
| *.parquet filter=lfs diff=lfs merge=lfs -text | |
| *.pb filter=lfs diff=lfs merge=lfs -text | |
| *.pickle filter=lfs diff=lfs merge=lfs -text | |
| *.pkl filter=lfs diff=lfs merge=lfs -text | |
| *.pt filter=lfs diff=lfs merge=lfs -text | |
| *.pth filter=lfs diff=lfs merge=lfs -text | |
| *.rar filter=lfs diff=lfs merge=lfs -text | |
| *.safetensors filter=lfs diff=lfs merge=lfs -text | |
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text | |
| *.tar.* filter=lfs diff=lfs merge=lfs -text | |
| *.tar filter=lfs diff=lfs merge=lfs -text | |
| *.tflite filter=lfs diff=lfs merge=lfs -text | |
| *.tgz filter=lfs diff=lfs merge=lfs -text | |
| *.wasm filter=lfs diff=lfs merge=lfs -text | |
| *.xz filter=lfs diff=lfs merge=lfs -text | |
| *.zip filter=lfs diff=lfs merge=lfs -text | |
| *.zst filter=lfs diff=lfs merge=lfs -text | |
| *tfevents* filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-16632/logs/0409_1833_llava...mstar_llava_model_args_7bd459/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-16632/logs/0409_1833_llava...mstar_llava_model_args_7bd459/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-3328/logs/0409_1820_llava...mstar_llava_model_args_b94fe7/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/checkpoint-3328/logs/0409_1820_llava...mstar_llava_model_args_b94fe7/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0412_1911_llava...mstar_llava_model_args_4172a9/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0412_1911_llava...mstar_llava_model_args_4172a9/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/gqa/0412_1934_llava_v1.5_gqa_llava_model_args_4172a9/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0412_1933_llava..._pope_llava_model_args_4172a9/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0412_1933_llava..._pope_llava_model_args_4172a9/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refine_665k_llava/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0412_1933_llava..._pope_llava_model_args_4172a9/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-16632/logs/0409_1803_llava..._pope_llava_model_args_7bd459/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-16632/logs/0409_1833_llava...mstar_llava_model_args_7bd459/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-16632/logs/0409_1833_llava...mstar_llava_model_args_7bd459/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-3328/logs/0409_1820_llava...mstar_llava_model_args_b94fe7/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev2_665k_llava/checkpoint-3328/logs/0409_1820_llava...mstar_llava_model_args_b94fe7/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/checkpoint-13312/logs/0418_1835_llava...u_val_llava_model_args_8261c1/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/checkpoint-6656/logs/0418_1819_llava...u_val_llava_model_args_473fc1/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/checkpoint-9984/logs/0418_1827_llava...u_val_llava_model_args_af441b/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1707_llava...mstar_llava_model_args_9259d6/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1707_llava...mstar_llava_model_args_9259d6/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1721_llava..._pope_llava_model_args_9259d6/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1721_llava..._pope_llava_model_args_9259d6/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1721_llava..._pope_llava_model_args_9259d6/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/smoe_refinev3_665k_llava/logs/0418_1748_llava_v1.5_gqa_llava_model_args_9259d6/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft_pretrain/Full_competesmoev30/checkpoint-1040/logs/0512_0233_llava...a_val_llava_model_args_f58958/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/0.02_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1103_llava...mstar_llava_model_args_16dc6f/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1103_llava...mstar_llava_model_args_16dc6f/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1110_llava..._pope_llava_model_args_16dc6f/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1110_llava..._pope_llava_model_args_16dc6f/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1110_llava..._pope_llava_model_args_16dc6f/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/logs/0418_1130_llava_v1.5_gqa_llava_model_args_16dc6f/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_norm/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0450_llava...mstar_llava_model_args_696dbd/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0450_llava...mstar_llava_model_args_696dbd/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0459_llava..._pope_llava_model_args_696dbd/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0459_llava..._pope_llava_model_args_696dbd/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0459_llava..._pope_llava_model_args_696dbd/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/logs/0417_0514_llava_v1.5_gqa_llava_model_args_696dbd/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_relu/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0523_llava...mstar_llava_model_args_2153fb/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0523_llava...mstar_llava_model_args_2153fb/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0532_llava..._pope_llava_model_args_2153fb/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0532_llava..._pope_llava_model_args_2153fb/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0532_llava..._pope_llava_model_args_2153fb/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/logs/0417_0547_llava_v1.5_gqa_llava_model_args_2153fb/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_sigmoid/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0416_2257_llava...mstar_llava_model_args_a34f80/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0416_2257_llava...mstar_llava_model_args_a34f80/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0411_llava...mstar_llava_model_args_a34f80/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0411_llava...mstar_llava_model_args_a34f80/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0418_llava..._pope_llava_model_args_a34f80/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0418_llava..._pope_llava_model_args_a34f80/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0418_llava..._pope_llava_model_args_a34f80/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/logs/0417_0441_llava_v1.5_gqa_llava_model_args_a34f80/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/act/moce_silu/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/hrloss/0.03_moce/logs/gqa/0404_0654_llava_v1.5_gqa_llava_model_args_b4e935/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/hrloss/0.03_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0404_2022_llava...mstar_llava_model_args_c2354b/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0404_2022_llava...mstar_llava_model_args_c2354b/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/gqa/0405_2347_llava_v1.5_gqa_llava_model_args_c2354b/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_2045_llava..._pope_llava_model_args_c2354b/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_2045_llava..._pope_llava_model_args_c2354b/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_competition/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_2045_llava..._pope_llava_model_args_c2354b/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0405_2242_llava...mstar_llava_model_args_6f8127/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0405_2242_llava...mstar_llava_model_args_6f8127/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/gqa/0405_2242_llava_v1.5_gqa_llava_model_args_6f8127/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0405_2253_llava..._pope_llava_model_args_6f8127/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0405_2253_llava..._pope_llava_model_args_6f8127/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0405_2253_llava..._pope_llava_model_args_6f8127/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/remove_diversity/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.03_moce/logs/gqa/0404_0741_llava_v1.5_gqa_llava_model_args_42bfb8/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.03_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.05_moce/logs/gqa/0404_0709_llava_v1.5_gqa_llava_model_args_b48daf/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.05_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.09_moce/logs/gqa/0404_0610_llava_v1.5_gqa_llava_model_args_84bad3/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/scheduler/0.09_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.2_moce/logs/gqa/0404_0504_llava_v1.5_gqa_llava_model_args_34716b/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.2_moce/logs/mmerealworld_lite,ocrbench/0404_0452_llava...bench_llava_model_args_34716b/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0404_0418_llava...mstar_llava_model_args_99e268/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/ai2d,mmbench_en_dev,mmmu_val,mmstar/0404_0418_llava...mstar_llava_model_args_99e268/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/gqa/0404_1451_llava_v1.5_gqa_llava_model_args_99e268/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_0428_llava..._pope_llava_model_args_99e268/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_0428_llava..._pope_llava_model_args_99e268/pope.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/logs/ocrbench,textvqa_val,mmerealworld_lite,pope/0404_0428_llava..._pope_llava_model_args_99e268/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/ablation_moce/theta/0.3_moce/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| CompeteSMoE/competesmoe_versions/Full_CS_BS_theta0.2_RL0.01_softmax_competesmoev30/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0224_llava..._pope_llava_model_args_bc59f1/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0224_llava..._pope_llava_model_args_bc59f1/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0224_llava..._pope_llava_model_args_bc59f1/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0224_llava..._pope_llava_model_args_bc59f1/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0224_llava..._pope_llava_model_args_bc59f1/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0613_0343_llava_v1.5_gqa_llava_model_args_bc59f1/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0617_0402_llava...a_val_llava_model_args_bc59f1/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/logs/0626_0643_llava_v1.5_pope_llava_model_args_bc59f1/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0616_2246_llava..._pope_llava_model_args_d02902/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0616_2246_llava..._pope_llava_model_args_d02902/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0616_2246_llava..._pope_llava_model_args_d02902/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0616_2246_llava..._pope_llava_model_args_d02902/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0616_2246_llava..._pope_llava_model_args_d02902/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0617_0149_llava...l_mme_llava_model_args_d02902/scienceqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0617_0304_llava...a_val_llava_model_args_d02902/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/logs/0626_1043_llava_v1.5_gqa_llava_model_args_d02902/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0616_2318_llava..._pope_llava_model_args_0a2586/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0616_2318_llava..._pope_llava_model_args_0a2586/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0616_2318_llava..._pope_llava_model_args_0a2586/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0616_2318_llava..._pope_llava_model_args_0a2586/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0616_2318_llava..._pope_llava_model_args_0a2586/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0617_0323_llava...a_val_llava_model_args_0a2586/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/logs/0626_1111_llava_v1.5_gqa_llava_model_args_0a2586/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0616_2349_llava..._pope_llava_model_args_2d4392/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0616_2349_llava..._pope_llava_model_args_2d4392/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0616_2349_llava..._pope_llava_model_args_2d4392/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0616_2349_llava..._pope_llava_model_args_2d4392/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0616_2349_llava..._pope_llava_model_args_2d4392/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0617_0343_llava...a_val_llava_model_args_2d4392/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/logs/0626_1221_llava_v1.5_gqa_llava_model_args_2d4392/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0312_llava..._pope_llava_model_args_35cab6/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0312_llava..._pope_llava_model_args_35cab6/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0312_llava..._pope_llava_model_args_35cab6/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0312_llava..._pope_llava_model_args_35cab6/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0312_llava..._pope_llava_model_args_35cab6/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/logs/0613_0314_llava_v1.5_gqa_llava_model_args_35cab6/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/std_0.002_Full_smoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0620_0432_llava..._pope_llava_model_args_5c6951/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0620_0432_llava..._pope_llava_model_args_5c6951/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0620_0432_llava..._pope_llava_model_args_5c6951/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0620_0432_llava..._pope_llava_model_args_5c6951/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0620_0432_llava..._pope_llava_model_args_5c6951/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0626_1513_llava...a_val_llava_model_args_5c6951/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/logs/0626_1526_llava_v1.5_gqa_llava_model_args_5c6951/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1531_llava..._pope_llava_model_args_179bff/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1531_llava..._pope_llava_model_args_179bff/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1531_llava..._pope_llava_model_args_179bff/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1531_llava..._pope_llava_model_args_179bff/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1531_llava..._pope_llava_model_args_179bff/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1719_llava..._pope_llava_model_args_179bff/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1719_llava..._pope_llava_model_args_179bff/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1719_llava..._pope_llava_model_args_179bff/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1719_llava..._pope_llava_model_args_179bff/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1719_llava..._pope_llava_model_args_179bff/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0625_1751_llava...a_val_llava_model_args_179bff/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/logs/0626_1437_llava_v1.5_gqa_llava_model_args_179bff/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/revise_Full_remoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0357_llava..._pope_llava_model_args_59313d/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0357_llava..._pope_llava_model_args_59313d/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0357_llava..._pope_llava_model_args_59313d/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0357_llava..._pope_llava_model_args_59313d/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0357_llava..._pope_llava_model_args_59313d/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_0430_llava...a_val_llava_model_args_59313d/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0626_1139_llava_v1.5_gqa_llava_model_args_59313d/gqa.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/logs/0627_1319_llava...l_mme_llava_model_args_1bb959/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/logs/0627_1319_llava...l_mme_llava_model_args_1bb959/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/logs/0627_1319_llava...l_mme_llava_model_args_1bb959/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/logs/0627_1319_llava...l_mme_llava_model_args_1bb959/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-27572/logs/0627_1319_llava...l_mme_llava_model_args_1bb959/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-6893/logs/0627_0249_llava...l_mme_llava_model_args_f4318b/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-6893/logs/0627_0249_llava...l_mme_llava_model_args_f4318b/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-6893/logs/0627_0249_llava...l_mme_llava_model_args_f4318b/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-6893/logs/0627_0249_llava...l_mme_llava_model_args_f4318b/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-6893/logs/0627_0249_llava...l_mme_llava_model_args_f4318b/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/logs/0627_1245_llava...l_mme_llava_model_args_18fef8/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/logs/0627_1245_llava...l_mme_llava_model_args_18fef8/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/logs/0627_1245_llava...l_mme_llava_model_args_18fef8/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/logs/0627_1245_llava...l_mme_llava_model_args_18fef8/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-20679/logs/0627_1245_llava...l_mme_llava_model_args_18fef8/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-13786/logs/0628_1431_llava...l_mme_llava_model_args_d81bcd/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-13786/logs/0628_1431_llava...l_mme_llava_model_args_d81bcd/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-13786/logs/0628_1431_llava...l_mme_llava_model_args_d81bcd/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-13786/logs/0628_1431_llava...l_mme_llava_model_args_d81bcd/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-13786/logs/0628_1431_llava...l_mme_llava_model_args_d81bcd/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/logs/0628_1536_llava...l_mme_llava_model_args_3e6edd/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/logs/0628_1536_llava...l_mme_llava_model_args_3e6edd/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/logs/0628_1536_llava...l_mme_llava_model_args_3e6edd/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/logs/0628_1536_llava...l_mme_llava_model_args_3e6edd/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-27572/logs/0628_1536_llava...l_mme_llava_model_args_3e6edd/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-6893/logs/0628_1330_llava...l_mme_llava_model_args_50d1c2/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-6893/logs/0628_1330_llava...l_mme_llava_model_args_50d1c2/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-6893/logs/0628_1330_llava...l_mme_llava_model_args_50d1c2/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-6893/logs/0628_1330_llava...l_mme_llava_model_args_50d1c2/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-6893/logs/0628_1330_llava...l_mme_llava_model_args_50d1c2/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/logs/0628_1504_llava...l_mme_llava_model_args_ed3dba/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/logs/0628_1504_llava...l_mme_llava_model_args_ed3dba/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/logs/0628_1504_llava...l_mme_llava_model_args_ed3dba/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/logs/0628_1504_llava...l_mme_llava_model_args_ed3dba/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_share/checkpoint-20679/logs/0628_1504_llava...l_mme_llava_model_args_ed3dba/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-13786/logs/0628_1643_llava...l_mme_llava_model_args_5e9e69/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-13786/logs/0628_1643_llava...l_mme_llava_model_args_5e9e69/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-13786/logs/0628_1643_llava...l_mme_llava_model_args_5e9e69/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-13786/logs/0628_1643_llava...l_mme_llava_model_args_5e9e69/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-13786/logs/0628_1643_llava...l_mme_llava_model_args_5e9e69/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/logs/0628_1751_llava...l_mme_llava_model_args_2dffa6/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/logs/0628_1751_llava...l_mme_llava_model_args_2dffa6/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/logs/0628_1751_llava...l_mme_llava_model_args_2dffa6/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/logs/0628_1751_llava...l_mme_llava_model_args_2dffa6/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-27572/logs/0628_1751_llava...l_mme_llava_model_args_2dffa6/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-6893/logs/0628_1609_llava...l_mme_llava_model_args_d8dc17/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-6893/logs/0628_1609_llava...l_mme_llava_model_args_d8dc17/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-6893/logs/0628_1609_llava...l_mme_llava_model_args_d8dc17/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-6893/logs/0628_1609_llava...l_mme_llava_model_args_d8dc17/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-6893/logs/0628_1609_llava...l_mme_llava_model_args_d8dc17/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/logs/0628_1717_llava...l_mme_llava_model_args_a39ef6/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/logs/0628_1717_llava...l_mme_llava_model_args_a39ef6/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/logs/0628_1717_llava...l_mme_llava_model_args_a39ef6/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/logs/0628_1717_llava...l_mme_llava_model_args_a39ef6/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_sigmoidgating/checkpoint-20679/logs/0628_1717_llava...l_mme_llava_model_args_a39ef6/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-13786/logs/0628_2120_llava...l_mme_llava_model_args_467343/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-13786/logs/0628_2120_llava...l_mme_llava_model_args_467343/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-13786/logs/0628_2120_llava...l_mme_llava_model_args_467343/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-13786/logs/0628_2120_llava...l_mme_llava_model_args_467343/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-13786/logs/0628_2120_llava...l_mme_llava_model_args_467343/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/logs/0628_2239_llava...l_mme_llava_model_args_7e5f99/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/logs/0628_2239_llava...l_mme_llava_model_args_7e5f99/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/logs/0628_2239_llava...l_mme_llava_model_args_7e5f99/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/logs/0628_2239_llava...l_mme_llava_model_args_7e5f99/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-27572/logs/0628_2239_llava...l_mme_llava_model_args_7e5f99/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_1825_llava...l_mme_llava_model_args_1b5567/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_1825_llava...l_mme_llava_model_args_1b5567/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_1825_llava...l_mme_llava_model_args_1b5567/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_1825_llava...l_mme_llava_model_args_1b5567/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_1825_llava...l_mme_llava_model_args_1b5567/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_2054_llava...l_mme_llava_model_args_1b5567/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_2054_llava...l_mme_llava_model_args_1b5567/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_2054_llava...l_mme_llava_model_args_1b5567/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_2054_llava...l_mme_llava_model_args_1b5567/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-6893/logs/0628_2054_llava...l_mme_llava_model_args_1b5567/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/logs/0628_2212_llava...l_mme_llava_model_args_732fc6/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/logs/0628_2212_llava...l_mme_llava_model_args_732fc6/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/logs/0628_2212_llava...l_mme_llava_model_args_732fc6/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/logs/0628_2212_llava...l_mme_llava_model_args_732fc6/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_xmoe/checkpoint-20679/logs/0628_2212_llava...l_mme_llava_model_args_732fc6/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/logs/0627_1428_llava...l_mme_llava_model_args_595126/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/logs/0627_1428_llava...l_mme_llava_model_args_595126/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/logs/0627_1428_llava...l_mme_llava_model_args_595126/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/logs/0627_1428_llava...l_mme_llava_model_args_595126/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-13786/logs/0627_1428_llava...l_mme_llava_model_args_595126/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-6893/logs/0627_1351_llava...l_mme_llava_model_args_746c3e/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-6893/logs/0627_1351_llava...l_mme_llava_model_args_746c3e/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-6893/logs/0627_1351_llava...l_mme_llava_model_args_746c3e/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-6893/logs/0627_1351_llava...l_mme_llava_model_args_746c3e/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-6893/logs/0627_1351_llava...l_mme_llava_model_args_746c3e/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/logs/0627_1503_llava...l_mme_llava_model_args_efed7a/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/logs/0627_1503_llava...l_mme_llava_model_args_efed7a/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/logs/0627_1503_llava...l_mme_llava_model_args_efed7a/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/logs/0627_1503_llava...l_mme_llava_model_args_efed7a/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_remoe/checkpoint-20679/logs/0627_1503_llava...l_mme_llava_model_args_efed7a/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-13786/logs/0629_0144_llava...l_mme_llava_model_args_735781/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-13786/logs/0629_0144_llava...l_mme_llava_model_args_735781/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-13786/logs/0629_0144_llava...l_mme_llava_model_args_735781/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-13786/logs/0629_0144_llava...l_mme_llava_model_args_735781/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-13786/logs/0629_0144_llava...l_mme_llava_model_args_735781/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0244_llava...l_mme_llava_model_args_59313d/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0244_llava...l_mme_llava_model_args_59313d/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0244_llava...l_mme_llava_model_args_59313d/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0244_llava...l_mme_llava_model_args_59313d/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0244_llava...l_mme_llava_model_args_59313d/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0425_llava_v1.5_pope_llava_model_args_59313d/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/logs/0629_0427_llava_v1.5_pope_llava_model_args_59313d/pope.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/logs/0629_0244_llava...l_mme_llava_model_args_498031/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/logs/0629_0244_llava...l_mme_llava_model_args_498031/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/logs/0629_0244_llava...l_mme_llava_model_args_498031/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/logs/0629_0244_llava...l_mme_llava_model_args_498031/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-27572/logs/0629_0244_llava...l_mme_llava_model_args_498031/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-6893/logs/0629_0110_llava...l_mme_llava_model_args_8331f0/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-6893/logs/0629_0110_llava...l_mme_llava_model_args_8331f0/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-6893/logs/0629_0110_llava...l_mme_llava_model_args_8331f0/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-6893/logs/0629_0110_llava...l_mme_llava_model_args_8331f0/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-6893/logs/0629_0110_llava...l_mme_llava_model_args_8331f0/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/logs/0629_0214_llava...l_mme_llava_model_args_26ed7e/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/logs/0629_0214_llava...l_mme_llava_model_args_26ed7e/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/logs/0629_0214_llava...l_mme_llava_model_args_26ed7e/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/logs/0629_0214_llava...l_mme_llava_model_args_26ed7e/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_tcmoe/checkpoint-20679/logs/0629_0214_llava...l_mme_llava_model_args_26ed7e/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-13786/logs/0627_1209_llava...l_mme_llava_model_args_8d283e/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-13786/logs/0627_1209_llava...l_mme_llava_model_args_8d283e/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-13786/logs/0627_1209_llava...l_mme_llava_model_args_8d283e/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-13786/logs/0627_1209_llava...l_mme_llava_model_args_8d283e/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe/checkpoint-13786/logs/0627_1209_llava...l_mme_llava_model_args_8d283e/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/revise_Full_smoe_perturbed/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| data/1M3 filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_plus_plus/checkpoint-27572/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_plus_plus/checkpoint-34462/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M3/Full_smoe_plus_plus/checkpoint-20679/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sigmoidgating/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_xmoe/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_share/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_tcmoe/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| Pretrain_language_model/save/test/checkpoint/save_tmp filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_plus_plus/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sharev3_not_norm/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sharev3/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-20791/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-12477/logs/0717_2000_llava...l_mme_llava_model_args_82420a/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-12477/logs/0717_2000_llava...l_mme_llava_model_args_82420a/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-12477/logs/0717_2000_llava...l_mme_llava_model_args_82420a/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-12477/logs/0717_2000_llava...l_mme_llava_model_args_82420a/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-12477/logs/0717_2000_llava...l_mme_llava_model_args_82420a/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2159_llava...u_val_llava_model_args_861273/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2213_llava...mstar_llava_model_args_861273/mathvista_testmini.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2213_llava...mstar_llava_model_args_861273/mme.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2213_llava...mstar_llava_model_args_861273/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2213_llava...mstar_llava_model_args_861273/mmstar.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2225_llava...mstar_llava_model_args_fc3596/mathvista_testmini.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2225_llava...mstar_llava_model_args_fc3596/mme.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2225_llava...mstar_llava_model_args_fc3596/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2225_llava...mstar_llava_model_args_fc3596/mmstar.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2237_llava...mstar_llava_model_args_82420a/mathvista_testmini.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2237_llava...mstar_llava_model_args_82420a/mme.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2237_llava...mstar_llava_model_args_82420a/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2237_llava...mstar_llava_model_args_82420a/mmstar.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2249_llava...mstar_llava_model_args_fe2b4a/mathvista_testmini.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2249_llava...mstar_llava_model_args_fe2b4a/mme.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2249_llava...mstar_llava_model_args_fe2b4a/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2249_llava...mstar_llava_model_args_fe2b4a/mmstar.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2301_llava...mstar_llava_model_args_fe4e53/mathvista_testmini.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2301_llava...mstar_llava_model_args_fe4e53/mme.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2301_llava...mstar_llava_model_args_fe4e53/mmmu_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/0717_2301_llava...mstar_llava_model_args_fe4e53/mmstar.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/logs/0717_1127_llava...l_mme_llava_model_args_5a2714/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/logs/0717_1127_llava...l_mme_llava_model_args_5a2714/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/logs/0717_1127_llava...l_mme_llava_model_args_5a2714/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/logs/0717_1127_llava...l_mme_llava_model_args_5a2714/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/logs/0717_1127_llava...l_mme_llava_model_args_5a2714/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-4159/logs/0717_1839_llava...l_mme_llava_model_args_861273/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-4159/logs/0717_1839_llava...l_mme_llava_model_args_861273/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-4159/logs/0717_1839_llava...l_mme_llava_model_args_861273/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-4159/logs/0717_1839_llava...l_mme_llava_model_args_861273/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-4159/logs/0717_1839_llava...l_mme_llava_model_args_861273/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-16636/logs/0717_2005_llava...l_mme_llava_model_args_fe2b4a/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-16636/logs/0717_2005_llava...l_mme_llava_model_args_fe2b4a/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-16636/logs/0717_2005_llava...l_mme_llava_model_args_fe2b4a/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-16636/logs/0717_2005_llava...l_mme_llava_model_args_fe2b4a/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-16636/logs/0717_2005_llava...l_mme_llava_model_args_fe2b4a/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-8318/logs/0717_1925_llava...l_mme_llava_model_args_fc3596/infovqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-8318/logs/0717_1925_llava...l_mme_llava_model_args_fc3596/mmbench_en_dev.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-8318/logs/0717_1925_llava...l_mme_llava_model_args_fc3596/mmerealworld_lite.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-8318/logs/0717_1925_llava...l_mme_llava_model_args_fc3596/submissions/mmbench_en_dev_results.xlsx filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/checkpoint-8318/logs/0717_1925_llava...l_mme_llava_model_args_fc3596/textvqa_val.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_plus_plus/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_plus_plus/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_share/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_share/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sigmoidgating/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sigmoidgating/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sigmoidgating/analysts/mmmu_val_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_xmoe/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_xmoe/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_xmoe/analysts/mmmu_val_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_xmoe/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_tcmoe/analysts/mathvista_testmini_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_tcmoe/analysts/mme_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_tcmoe/analysts/mmmu_val_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_tcmoe/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_plus_plus/analysts/mmmu_val_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_plus_plus/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe/analysts/mmmu_val_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_share/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/Full_smoe_sigmoidgating/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_smoe_sharev3/analysts/mmstar_data_selected_final.json filter=lfs diff=lfs merge=lfs -text | |
| sft/665K36/revise_Full_competesmoe/checkpoint-16636/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| Pretrain_language_model/save/slimpajama_competesmoe_no_attmoe_660M_standardlb/competesmoe_div0.01/model-20000.pth.txt filter=lfs diff=lfs merge=lfs -text | |
| sft/665K/o_grad_Full_competesmoe/checkpoint-16632/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe/checkpoint-31320/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe/checkpoint-39148/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe/checkpoint-23490/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_share/checkpoint-31320/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_share/checkpoint-39148/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_share/checkpoint-23490/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_sigmoidgating/checkpoint-31320/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_sigmoidgating/checkpoint-39148/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_sigmoidgating/checkpoint-23490/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-31320/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-35235/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-39148/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-23490/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-27405/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_xmoe/checkpoint-19575/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_sharev3/checkpoint-19575/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |
| sft/1M2/Full_smoe_plus_plus/checkpoint-19575/trainer_state.json filter=lfs diff=lfs merge=lfs -text | |