Skip to content

Commit f148d68

Browse files
committed
update: add aca
1 parent df05250 commit f148d68

File tree

10 files changed

+719
-0
lines changed

10 files changed

+719
-0
lines changed
Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
# @package _global_
2+
3+
algo:
4+
name: aca
5+
target_update_freq: 1
6+
feature_dim: 512
7+
rff_dim: 1024
8+
critic_hidden_dims: [512, 512]
9+
reward_hidden_dims: [512, 512]
10+
phi_hidden_dims: [512, 512]
11+
mu_hidden_dims: [512, 512]
12+
ctrl_coef: 1.0
13+
reward_coef: 1.0
14+
critic_coef: 1.0
15+
critic_activation: elu # not used
16+
back_critic_grad: false
17+
feature_lr: 0.0001
18+
critic_lr: 0.0003
19+
discount: 0.99
20+
num_samples: 10
21+
ema: 0.005
22+
feature_ema: 0.005
23+
clip_grad_norm: null
24+
temp: 0.1
25+
diffusion:
26+
time_dim: 64
27+
mlp_hidden_dims: [512, 512, 512]
28+
lr: 0.0003
29+
end_lr: null
30+
lr_decay_steps: null
31+
lr_decay_begin: null
32+
steps: 20
33+
clip_sampler: true
34+
x_min: -1.0
35+
x_max: 1.0
36+
solver: ddpm
37+
num_noises: 25
38+
linear: false
39+
ranking: true
40+
41+
norm_obs: true

examples/online/main_dmc_offpolicy.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@
2929
"ctrl_td3": CtrlTD3Agent,
3030
"qsm": QSMAgent,
3131
"ctrl_qsm": CtrlQSMAgent,
32+
"aca": ACAAgent,
3233
}
3334

3435
class OffPolicyTrainer():

flowrl/agent/online/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@
99
from .sdac import SDACAgent
1010
from .td3 import TD3Agent
1111
from .td7.td7 import TD7Agent
12+
from .unirep import *
1213

1314
__all__ = [
1415
"BaseAgent",
@@ -24,4 +25,5 @@
2425
"ALACAgent",
2526
"CtrlTD3Agent",
2627
"CtrlQSMAgent",
28+
"ACAAgent",
2729
]
Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
from .aca import ACAAgent
2+
3+
__all__ = [
4+
"ACAAgent",
5+
]

0 commit comments

Comments
 (0)