Ctrl+K
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_gate_v5
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_gate_v5_multiprompt
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_gate_v5_multiprompt_mixfv
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256_finevision
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256_mixfinevision
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_len-pan-max-256_tmp
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t128_s10_c20
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t256_s20_c40
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1_lpan_t384_s5_c10
- grpo_Qwen2.5-VL-3B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep3
- grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro16_n8_lr5e-6_cosine_ep1_gate_v5_multiprompt_mixfv
- grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro16_n8_lr5e-6_cosine_ep1_len-pan-max-256
- grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro16_n8_lr5e-6_cosine_ep1_len-pan-max-256_mixfinevision
- grpo_Qwen2.5-VL-7B-Instruct_tr1024_mini256_micro32_n8_lr5e-6_cosine_ep1
- llava_vqa_judge_grpo_local_qwen3
- llava_vqa_judge_grpo_local_qwen3_new_1epoch
- sft_qwen2.5vl3b_gpt_llava_multiprompt_2ep
- sft_qwen2.5vl3b_gpt_llava_rephrase8_2ep
- sft_qwen2.5vl3b_gpt_mixfv_multiprompt
- sft_qwen2.5vl3b_gpt_mixfv_multiprompt_2ep
- sft_qwen2.5vl3b_gpt_mixfv_rephrase8_2ep
- sft_qwen2.5vl7b_gpt_llava_multiprompt_2ep
- sft_qwen2.5vl7b_gpt_llava_rephrase8_2ep
- sft_qwen2.5vl7b_gpt_mixfv_multiprompt
- sft_qwen2.5vl7b_gpt_mixfv_multiprompt_1ep
- sft_qwen2.5vl7b_gpt_mixfv_multiprompt_2ep
- sft_qwen2.5vl7b_gpt_mixfv_rephrase8_2ep
- 2.77 kB