| 541 |
qwen3-4b-agent-trajectory_alf_admissible-lora-constraint_gen-dist_allign_b |
HuggingFace |
2.22 |
unrated |
| 542 |
qwen3-4b-agent-trajectory_alf_admissible-lora-constraint_gen-dist_allign_c |
HuggingFace |
2.22 |
unrated |
| 543 |
qwen3-4b-agent-trajectory_alf_admPlusExtra-lora-constraint_gen-dist_allign |
HuggingFace |
2.22 |
unrated |
| 544 |
qwen3-4b-agent-trajectory_dpo_v1 |
HuggingFace |
2.22 |
unrated |
| 545 |
qwen3-4b-agent-trajectory-lora-add_constraint_prompt |
HuggingFace |
2.22 |
unrated |
| 546 |
qwen3-4b-agent-trajectory-lora-base |
HuggingFace |
2.22 |
unrated |
| 547 |
qwen3-4b-agent-trajectory-lora-constraint_gen-dist_allign |
HuggingFace |
2.22 |
unrated |
| 548 |
qwen3-4b-agent-trajectory-lora-sft_dpo_v1 |
HuggingFace |
2.22 |
unrated |
| 549 |
qwen3-4b-agent-trajectory-lora-sft_dpo_v2 |
HuggingFace |
2.22 |
unrated |
| 550 |
qwen3-4b-agent-trajectory-lora-sft_dpo_v3 |
HuggingFace |
2.22 |
unrated |
| 551 |
qwen3-4b-agent-trajectory-lora-sft_dpo_v3-a |
HuggingFace |
2.22 |
unrated |
| 552 |
qwen3-4b-agent-trajectory-lora-sft_multi_dpo |
HuggingFace |
2.22 |
unrated |
| 553 |
qwen3-4b-agent-trajectory-lora-sft_multi_dpo_merged |
HuggingFace |
2.22 |
unrated |
| 554 |
qwen3-4b-agent-trajectory-SFT_alfadm2-prmcons_alformat1 |
HuggingFace |
2.22 |
unrated |
| 555 |
qwen3-4b-agent-trajectory-SFT_alfadm-prmcons_alformat2 |
HuggingFace |
2.22 |
unrated |
| 556 |
qwen3-4b-agent-trajectory-SFT_alfadm-prmcons_alformat3 |
HuggingFace |
2.22 |
unrated |
| 557 |
Qwen2.5-7B-agent-trajectory-lora_1 |
HuggingFace |
2.22 |
unrated |
| 558 |
Qwen2.5-7B-agent-trajectory-lora_10_1 |
HuggingFace |
2.22 |
unrated |
| 559 |
Qwen2.5-7B-agent-trajectory-lora_12_1 |
HuggingFace |
2.22 |
unrated |
| 560 |
Qwen2.5-7B-agent-trajectory-lora_2 |
HuggingFace |
2.22 |
unrated |