mlgym-bench
v1.0
Evaluates agents on ML tasks across computer vision, RL, tabular ML, and game theory.
harbor run -d mlgym-bench@1.0
Tasks (12)
mlgym-battle-of-sexes
harbor run -d mlgym-bench@1.0 -t mlgym-battle-of-sexes
325a5c5
mlgym-blotto
harbor run -d mlgym-bench@1.0 -t mlgym-blotto
325a5c5
mlgym-image-classification-cifar10
harbor run -d mlgym-bench@1.0 -t mlgym-image-classification-cifar10
325a5c5
mlgym-image-classification-cifar10-l1
harbor run -d mlgym-bench@1.0 -t mlgym-image-classification-cifar10-l1
325a5c5
mlgym-image-classification-f-mnist
harbor run -d mlgym-bench@1.0 -t mlgym-image-classification-f-mnist
325a5c5
mlgym-prisoners-dilemma
harbor run -d mlgym-bench@1.0 -t mlgym-prisoners-dilemma
325a5c5
mlgym-regression-kaggle-house-price
harbor run -d mlgym-bench@1.0 -t mlgym-regression-kaggle-house-price
325a5c5
mlgym-regression-kaggle-house-price-l1
harbor run -d mlgym-bench@1.0 -t mlgym-regression-kaggle-house-price-l1
325a5c5
mlgym-rl-meta-maze-misc
harbor run -d mlgym-bench@1.0 -t mlgym-rl-meta-maze-misc
325a5c5
mlgym-rl-mountain-car-continuous
harbor run -d mlgym-bench@1.0 -t mlgym-rl-mountain-car-continuous
325a5c5
mlgym-rl-mountain-car-continuous-reinforce
harbor run -d mlgym-bench@1.0 -t mlgym-rl-mountain-car-continuous-reinforce
325a5c5
mlgym-titanic
harbor run -d mlgym-bench@1.0 -t mlgym-titanic
325a5c5