Skip to content
This repository was archived by the owner on Jun 2, 2025. It is now read-only.
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
64 commits
Select commit Hold shift + click to select a range
b3068c9
Added sac codebase. Works independently.
ShahRutav Jan 11, 2023
f37ac89
Added small test codebase.
ShahRutav Jan 11, 2023
09bad16
Merge branch 'dev' into sac_dev
ShahRutav Jan 13, 2023
6c03e9c
test.py updated with another bug
ShahRutav Jan 13, 2023
50ae2e0
small change with updated torchrl
ShahRutav Jan 13, 2023
f2d9b43
working sac codebase. cleanup
ShahRutav Jan 14, 2023
b576682
added installation script. sac configs correct
ShahRutav Jan 15, 2023
2f07d0c
Added a new running instruction for SAC+R3M
ShahRutav Jan 15, 2023
e6067c4
Fixed readme
ShahRutav Jan 15, 2023
c6084e8
Added redq codebase from torchrl
ShahRutav Jan 15, 2023
d39bd0c
Merge branch 'sac_dev' of github.com:facebookresearch/rlhive into sac…
ShahRutav Jan 15, 2023
1f02c30
updated redq script with robohive env
ShahRutav Jan 16, 2023
fab9084
Added RRLTransform
ShahRutav Jan 16, 2023
76e601a
moved rrl_transform inside helpers
ShahRutav Jan 16, 2023
850c3d9
Updated README with parameter sweep
ShahRutav Jan 17, 2023
2a942ab
updated redq with action, state, and obs norms
ShahRutav Jan 24, 2023
bd932d3
Merge branch 'sac_dev' of github.com:facebookresearch/rlhive into sac…
ShahRutav Jan 24, 2023
bc49e48
Merge branch 'dev' into sac_dev
vmoens Jan 24, 2023
e3cd33d
Merge branch 'sac_dev' of https://github.com/facebookresearch/rlhive …
vmoens Jan 24, 2023
5823199
updated the code with torchrl sacloss and rrl transform
ShahRutav Jan 25, 2023
e68f917
init
vmoens Jan 27, 2023
721394c
amend
vmoens Jan 27, 2023
47dbc8a
amend
vmoens Jan 27, 2023
e120d7b
amend
vmoens Jan 27, 2023
582020c
amend
vmoens Jan 27, 2023
ad060d8
amend
vmoens Jan 27, 2023
e1225d5
amend
vmoens Jan 27, 2023
79d1eae
amend
vmoens Jan 27, 2023
5d87afc
amend
vmoens Jan 27, 2023
2af22a4
amend
vmoens Jan 27, 2023
65bd6ef
amend
vmoens Jan 27, 2023
bbb1d72
amend
vmoens Jan 27, 2023
ab22dec
amend
vmoens Jan 27, 2023
3168908
amend
vmoens Jan 27, 2023
c85a24d
amend
vmoens Jan 27, 2023
bbcd73d
amend
vmoens Jan 27, 2023
dc68e2e
rl_env updated for state based experiments
Jan 28, 2023
faa46de
amend
vmoens Jan 28, 2023
e895912
init
vmoens Jan 13, 2023
3da5e5c
amend
vmoens Jan 13, 2023
eee0d4b
amend
vmoens Jan 13, 2023
2e5e1e6
minor
vmoens Jan 13, 2023
caa66e1
Some more info in GET_STARTED.md
vmoens Jan 23, 2023
c935d24
Fix ref to wandb
vmoens Jan 23, 2023
1af25a9
cleanup
vmoens Jan 24, 2023
ad20206
init
vmoens Jan 27, 2023
1bbddd4
amend
vmoens Jan 27, 2023
fea42b2
amend
vmoens Jan 27, 2023
a43e2a4
amend
vmoens Jan 27, 2023
8cb852d
amend
vmoens Jan 27, 2023
deeb272
amend
vmoens Jan 27, 2023
ff4895a
amend
vmoens Jan 27, 2023
3224ec2
amend
vmoens Jan 27, 2023
4573419
amend
vmoens Jan 27, 2023
97180ae
amend
vmoens Jan 27, 2023
7106f01
amend
vmoens Jan 27, 2023
f71a155
amend
vmoens Jan 27, 2023
a28404b
amend
vmoens Jan 27, 2023
1ac5466
amend
vmoens Jan 27, 2023
a7be171
amend
vmoens Jan 27, 2023
22d91cb
amend
vmoens Jan 27, 2023
0659cca
merged with sac_example
Jan 28, 2023
1a6e527
moving the sac_loss to local file
Jan 28, 2023
c521fcd
updated with rrl,r3m,flatten transforms, added visual hand envs
Jan 31, 2023
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
46 changes: 46 additions & 0 deletions examples/config/sac.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,46 @@
# Configuration for the SAC example (examples/config/sac.yaml).
# NOTE(review): Hydra's defaults list is normally keyed `defaults:`; confirm
# that `default:` is intentional and that these overrides actually take effect.
default:
- override hydra/output: local
- override hydra/launcher: local

# Logger
# exp_name is built by interpolating the `task` and `visual_transform` values
# defined in this file.
exp_name: ${task}_sac_${visual_transform}
visual_transform: r3m
record_interval: 1
# `device` and `device_collection` name two different CUDA devices, so this
# default presumably needs at least two GPUs — TODO confirm.
device: "cuda:0"
device_collection: "cuda:1"
wandb_entity: "RLHive"
wandb_mode: "offline"

# Environment
task: visual_franka_slide_random-v3
#frame_skip: 1
reward_scaling: 5.0
init_env_steps: 1000
seed: 42
eval_traj: 25
eval_interval: 1000
num_envs: 8

# Collector
env_per_collector: 1
# NOTE(review): -1 looks like a "no limit" sentinel — confirm against the consumer.
max_frames_per_traj: -1
total_frames: 1000000
init_random_frames: 25000
frames_per_batch: 1000

# Replay Buffer
# NOTE(review): `prb` presumably toggles a prioritized replay buffer (0 = off) — confirm.
prb: 0
buffer_size: 100000
buffer_scratch_dir: /tmp/

# Optimization
gamma: 0.99
batch_size: 256
lr: 3.0e-4
weight_decay: 0.0
target_update_polyak: 0.995
utd_ratio: 1

# Hydra job name, interpolated from the `task` and `seed` values above.
# NOTE(review): `job` and `name` appear un-indented here; they presumably nest
# under `hydra` (hydra.job.name) — confirm the indentation in the real file.
hydra:
job:
name: sac_${task}_${seed}
41 changes: 41 additions & 0 deletions examples/install/install_rlhive.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
#!/bin/zsh

# Instructions to install a fresh anaconda environment with RLHive.
#
# Steps performed, in order:
#   1. source conda's shell hook and load the cuda/11.6 module,
#   2. recreate the `rlhive` conda environment (python 3.8),
#   3. install nightly PyTorch (cu116), mj_envs, tensordict and torchrl,
#   4. install the local checkout in editable mode, then the extra tools.
#
# Requires `conda`, `git` and the `module` command to be available.
# NOTE(review): the `cd ../..` before `pip install -e .` presumably expects the
# script to be launched from examples/install inside an rlhive checkout — confirm.

# Abort on the first failing command.
set -e

# Locate the base conda installation so `conda activate` works in this shell.
conda_path=$(conda info | grep -i 'base environment' | awk '{ print $4 }')
source "$conda_path/etc/profile.d/conda.sh"

# Remember the launch directory; later steps cd away and come back to it.
here=$(pwd)
module_path=$HOME/modules/

module purge
module load cuda/11.6

# Best effort: removing the environment may fail when it does not exist yet
# (e.g. on a first install); that must not abort the script under `set -e`.
conda env remove -n rlhive -y || true

conda create -n rlhive -y python=3.8

conda activate rlhive

python3 -mpip install --pre torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/nightly/cu116

# -p: do not fail (and abort under `set -e`) when the directory already exists.
mkdir -p "$module_path"
cd "$module_path"
# The neuromuscular_sim submodule is skipped via its update=none setting.
git clone -c submodule.mj_envs/sims/neuromuscular_sim.update=none --branch v0.4dev --recursive https://github.com/vikashplus/mj_envs.git mj_envs
cd mj_envs
python3 -mpip install . # one can also install it locally with the -e flag
cd "$here"

python3 -mpip install git+https://github.com/pytorch-labs/tensordict # or stable or nightly with pip install tensordict(-nightly)
python3 -mpip install git+https://github.com/pytorch/rl.git # or stable or nightly with pip install torchrl(-nightly)

# this
# python3 -mpip install git+https://github.com/facebookresearch/rlhive.git # or stable or nightly with pip install torchrl(-nightly)
# or this
cd ../..
pip install -e .
cd "$here"

pip install wandb tqdm hydra-core moviepy
Loading