#!/usr/bin/env bash
# Run the toy examples: invoke train_toy_game.py once per mode (-m 0, 1, 2).
#
# Usage: run this script from the directory that contains train_toy_game.py
# (the script path below is relative to the current working directory).
#
# Every mode is attempted even if an earlier one fails, so one broken run
# does not prevent the others from executing. The exit status is 0 only when
# all runs succeeded; otherwise it is the status of the first run that failed.

# Status of the first failed run; stays 0 while everything succeeds.
status=0

# ==== entropy-Diff + Q-ensemble ====
python train_toy_game.py -m 0 || status=$?
# ===================================

# ======= entropy + diffusion =======
# Only record this failure if no earlier run has already failed.
python train_toy_game.py -m 1 || { rc=$?; [ "$status" -ne 0 ] || status=$rc; }
# ===================================

# ======= standard diffusion ========
python train_toy_game.py -m 2 || { rc=$?; [ "$status" -ne 0 ] || status=$rc; }
# ===================================

# Propagate failure to the caller instead of reporting only the last run.
exit "$status"
