forked from johnjim0816/joyrl-offline
-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.py
29 lines (29 loc) · 1.09 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/usr/bin/env python
# coding=utf-8
'''
Author: JiangJi
Email: [email protected]
Date: 2023-02-21 20:32:11
LastEditor: JiangJi
LastEditTime: 2023-05-18 13:38:56
Description:
'''
from config.config import DefaultConfig
class AlgoConfig(DefaultConfig):
    ''' Hyperparameters of the algorithm: exploration schedule, optimisation
        settings, replay buffer sizes and the value network layout.
    '''
    def __init__(self) -> None:
        # NOTE(review): DefaultConfig.__init__ is not invoked here; confirm
        # that skipping the base initialiser is intended.

        # Epsilon schedule. Making epsilon_start equal to epsilon_end gives a
        # fixed epsilon, i.e. epsilon = epsilon_end.
        self.epsilon_start = 0.95  # initial value of epsilon
        self.epsilon_end = 0.01  # final value of epsilon
        self.epsilon_decay = 500  # decay setting of epsilon

        # Learning settings.
        self.gamma = 0.95  # discount factor applied to rewards
        self.lr = 1e-4  # learning rate
        self.buffer_size = 100000  # size of the replay buffer
        self.batch_size = 64  # size of a batch
        self.target_update = 4  # update frequency of the target network

        # Value network layout: identical 'noisy_linear' layer specs. Each
        # spec is built as a separate dict (with its own 'layer_size' list),
        # so changing one entry never affects the other.
        noisy_layer_count = 2
        self.value_layers = [
            {
                'layer_type': 'noisy_linear',
                'layer_size': [64],
                'activation': 'ReLU',
                'std_init': 0.4,
            }
            for _ in range(noisy_layer_count)
        ]