- 機械学習ライブラリ:PyTorch(論文「PyTorch: An Imperative Style, High-Performance Deep Learning Library」)
- デバッグツール:Weights & Biases
git clone https://github.com/sql-hkr/offline-rl
cd offline-rl
python setup.py develop
Dockerイメージ:Dockerfile
git clone https://github.com/sql-hkr/offline-rl
cd offline-rl
docker build -t offline-rl .
docker run --gpus all -it -v $PWD:/workspace offline-rl
python train_d4rl.py --algo_name={algo} --task {env} --seed 0 --lam 0.9
例:
python train_d4rl.py --algo_name=mcq --task walker2d-medium-v2 --seed 6 --lam 0.9