| 48921 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-60step |
HuggingFace |
1.30 |
unrated |
| 48922 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-75step |
HuggingFace |
1.30 |
unrated |
| 48923 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info300-90step |
HuggingFace |
1.30 |
unrated |
| 48924 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-105step |
HuggingFace |
1.30 |
unrated |
| 48925 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-120step |
HuggingFace |
1.30 |
unrated |
| 48926 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-135step |
HuggingFace |
1.30 |
unrated |
| 48927 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-150step |
HuggingFace |
1.30 |
unrated |
| 48928 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-15step |
HuggingFace |
1.30 |
unrated |
| 48929 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-30step |
HuggingFace |
1.30 |
unrated |
| 48930 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-45step |
HuggingFace |
1.30 |
unrated |
| 48931 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-60step |
HuggingFace |
1.30 |
unrated |
| 48932 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-75step |
HuggingFace |
1.30 |
unrated |
| 48933 |
aug-verl_agent_alfworld-GRPO-kl0.01-from-webshop-Llama-3.1-8B-Instruct-info50-90step |
HuggingFace |
1.30 |
unrated |
| 48934 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-105step |
HuggingFace |
1.30 |
unrated |
| 48935 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-120step |
HuggingFace |
1.30 |
unrated |
| 48936 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-135step |
HuggingFace |
1.30 |
unrated |
| 48937 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-150step |
HuggingFace |
1.30 |
unrated |
| 48938 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-15step |
HuggingFace |
1.30 |
unrated |
| 48939 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-30step |
HuggingFace |
1.30 |
unrated |
| 48940 |
aug_verl_agent_webshop-GRPO-kl-0.01-from-webshop-20step-v2-Llama-3.1-8B-Instruct-info100-45step |
HuggingFace |
1.30 |
unrated |