TheoVincent committed on
Commit
9bd27a8
·
1 Parent(s): b0bc0be

unique config.json

Browse files
README.md CHANGED
@@ -26,7 +26,7 @@ The sparse model parameters were obtained with [EauDeQN](https://arxiv.org/pdf/2
26
 
27
  5 seeds are available for each configuration which makes a total of **750 available models** 📈.
28
 
29
- The [evaluate.ipynb](./evaluate.ipynb) notebook contains a minimal example to evaluate to model parameters 🧑‍🏫 It uses JAX 🚀 The hyperparameters used during training are reported in [online_config.json](./online_config.json) and [offline_config.json](./offline_config.json) 🔧
30
 
31
  The training code is available soon ⏳
32
 
 
26
 
27
  5 seeds are available for each configuration which makes a total of **750 available models** 📈.
28
 
29
+ The [evaluate.ipynb](./evaluate.ipynb) notebook contains a minimal example to evaluate to model parameters 🧑‍🏫 It uses JAX 🚀 The hyperparameters used during training are reported in [config.json](./config.json) 🔧
30
 
31
  The training code is available soon ⏳
32
 
online_config.json → config.json RENAMED
@@ -1,5 +1,6 @@
1
  {
2
- "shared_parameters": {
 
3
  "replay_buffer_capacity": 1000000,
4
  "batch_size": 32,
5
  "update_horizon": 1,
@@ -33,5 +34,41 @@
33
  "sparcity_update_freq": 4000,
34
  "final_sparsity": 0.95
35
  },
36
- "dqn": {}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  }
 
1
  {
2
+ "ONLINE PARAMETERS": "-------------------",
3
+ "online_shared_parameters": {
4
  "replay_buffer_capacity": 1000000,
5
  "batch_size": 32,
6
  "update_horizon": 1,
 
34
  "sparcity_update_freq": 4000,
35
  "final_sparsity": 0.95
36
  },
37
+ "dqn": {},
38
+ "OFFLINE PARAMETERS": "-------------------",
39
+ "offline_shared_parameters": {
40
+ "features": [
41
+ 32,
42
+ 64,
43
+ 64,
44
+ "Feature Size"
45
+ ],
46
+ "replay_buffer_capacity": 50000,
47
+ "batch_size": 32,
48
+ "update_horizon": 1,
49
+ "gamma": 0.99,
50
+ "learning_rate": 5e-05,
51
+ "architecture_type": "cnn",
52
+ "target_update_frequency": 2000,
53
+ "n_buffers_to_load": 5,
54
+ "n_epochs": 50,
55
+ "n_fitting_steps": 62500
56
+ },
57
+ "eaudecql": {
58
+ "n_networks": 5,
59
+ "max_noise": 3.0,
60
+ "max_speed": 0.01,
61
+ "reset_optimizer": true,
62
+ "alpha_cql": 0.1
63
+ },
64
+ "polyprunecql": {
65
+ "sparcity_start_step": 625000,
66
+ "sparcity_end_step": 2500000,
67
+ "sparcity_update_freq": 1000,
68
+ "final_sparsity": 0.95,
69
+ "alpha_cql": 0.1
70
+ },
71
+ "cql": {
72
+ "alpha_cql": 0.1
73
+ }
74
  }
offline_config.json DELETED
@@ -1,37 +0,0 @@
1
- {
2
- "shared_parameters": {
3
- "features": [
4
- 32,
5
- 64,
6
- 64,
7
- "Feature Size"
8
- ],
9
- "replay_buffer_capacity": 50000,
10
- "batch_size": 32,
11
- "update_horizon": 1,
12
- "gamma": 0.99,
13
- "learning_rate": 5e-05,
14
- "architecture_type": "cnn",
15
- "target_update_frequency": 2000,
16
- "n_buffers_to_load": 5,
17
- "n_epochs": 50,
18
- "n_fitting_steps": 62500
19
- },
20
- "eaudecql": {
21
- "n_networks": 5,
22
- "max_noise": 3.0,
23
- "max_speed": 0.01,
24
- "reset_optimizer": true,
25
- "alpha_cql": 0.1
26
- },
27
- "polyprunecql": {
28
- "sparcity_start_step": 625000,
29
- "sparcity_end_step": 2500000,
30
- "sparcity_update_freq": 1000,
31
- "final_sparsity": 0.95,
32
- "alpha_cql": 0.1
33
- },
34
- "cql": {
35
- "alpha_cql": 0.1
36
- }
37
- }