| 48901 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info100-60step |
HuggingFace |
1.30 |
unrated |
| 48902 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info100-75step |
HuggingFace |
1.30 |
unrated |
| 48903 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info100-90step |
HuggingFace |
1.30 |
unrated |
| 48904 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-105step |
HuggingFace |
1.30 |
unrated |
| 48905 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-120step |
HuggingFace |
1.30 |
unrated |
| 48906 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-135step |
HuggingFace |
1.30 |
unrated |
| 48907 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-150step |
HuggingFace |
1.30 |
unrated |
| 48908 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-15step |
HuggingFace |
1.30 |
unrated |
| 48909 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-30step |
HuggingFace |
1.30 |
unrated |
| 48910 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-45step |
HuggingFace |
1.30 |
unrated |
| 48911 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-60step |
HuggingFace |
1.30 |
unrated |
| 48912 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-75step |
HuggingFace |
1.30 |
unrated |
| 48913 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info200-90step |
HuggingFace |
1.30 |
unrated |
| 48914 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-105step |
HuggingFace |
1.30 |
unrated |
| 48915 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-120step |
HuggingFace |
1.30 |
unrated |
| 48916 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-135step |
HuggingFace |
1.30 |
unrated |
| 48917 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-150step |
HuggingFace |
1.30 |
unrated |
| 48918 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-15step |
HuggingFace |
1.30 |
unrated |
| 48919 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-30step |
HuggingFace |
1.30 |
unrated |
| 48920 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-45step |
HuggingFace |
1.30 |
unrated |