emiliodavola committed on
Commit
79f020d
·
1 Parent(s): 47972eb

Upload model_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. model_config.json +40 -0
model_config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "dqn",
3
+ "task": "reinforcement-learning",
4
+ "environment": "french-solitaire-7x7",
5
+ "algorithm": "double-dqn",
6
+ "framework": "pytorch",
7
+ "state_dim": 49,
8
+ "action_dim": 100,
9
+ "architecture": {
10
+ "type": "mlp",
11
+ "layers": [
12
+ {"type": "linear", "in": 49, "out": 128},
13
+ {"type": "relu"},
14
+ {"type": "linear", "in": 128, "out": 128},
15
+ {"type": "relu"},
16
+ {"type": "linear", "in": 128, "out": 100}
17
+ ]
18
+ },
19
+ "hyperparameters": {
20
+ "learning_rate": 0.0005,
21
+ "gamma": 0.99,
22
+ "epsilon_start": 1.0,
23
+ "epsilon_end": 0.01,
24
+ "epsilon_decay": 0.995,
25
+ "batch_size": 64,
26
+ "buffer_size": 10000,
27
+ "target_update_freq": 100
28
+ },
29
+ "training": {
30
+ "episodes": 15000,
31
+ "max_steps_per_episode": 200,
32
+ "device": "cuda"
33
+ },
34
+ "performance": {
35
+ "win_rate": "TBD",
36
+ "center_win_rate": "TBD",
37
+ "avg_reward": "TBD",
38
+ "avg_pegs_remaining": "TBD"
39
+ }
40
+ }