-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmodel_architecture
130 lines (130 loc) · 4.47 KB
/
model_architecture
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
// Directed graph whose operation nodes carry autograd-style labels
// (AddmmBackward0, TanhBackward0, AccumulateGrad, ...). Edges run from
// parameter nodes, through the operations that consume them, toward three
// shape-only result nodes.
// NOTE(review): presumably generated by a tool such as torchviz from a PyTorch
// model; the numeric node ids look like object ids from one run — confirm.
// Node kinds as used in this file:
//   fillcolor=lightblue        named parameters, label = "<name>\n(<shape>)"
//   fillcolor=darkolivegreen1  result nodes, label = shape only
//   fillcolor=darkolivegreen3  extra shape-only node linked by a dotted edge
//   (no fillcolor)             backward-operation nodes
digraph {
// Graph-wide drawing size.
graph [size="16.5,16.5"]
// Defaults applied to every node declared below.
// NOTE(review): `ranksep` is documented by Graphviz as a graph attribute and
// `align` is not a listed attribute, so both are likely ignored here — confirm
// before relying on them for layout.
node [align=left fontname=monospace fontsize=10 height=0.2 ranksep=0.1 shape=box style=filled]
// ---- Result node with shape (1, 2) --------------------------------------
// No operation node feeds this result; its only incoming edge is the dotted
// one from the darkolivegreen3 node of the same shape.
// NOTE(review): presumably the dotted edge marks a view/base tensor
// relationship — confirm against the generator.
2263593188832 [label="
(1, 2)" fillcolor=darkolivegreen1]
2263593188432 [label="
(1, 2)" fillcolor=darkolivegreen3]
2263593188432 -> 2263593188832 [style=dotted]
// ---- Result node with shape (1, 1): value branch ------------------------
// Fed by AddmmBackward0 (2263578566400), which takes value_net.bias,
// a Tanh output, and the transposed value_net.weight (1, 64).
2263581907360 [label="
(1, 1)" fillcolor=darkolivegreen1]
2263578566400 [label=AddmmBackward0]
2263592572368 -> 2263578566400
2263541364720 [label="value_net.bias
(1)" fillcolor=lightblue]
2263541364720 -> 2263592572368
2263592572368 [label=AccumulateGrad]
2263574703136 -> 2263578566400
2263574703136 [label=TanhBackward0]
2263573954272 -> 2263574703136
// Second value-side Addmm: mlp_extractor.value_net.2 (bias 64, weight 64x64).
2263573954272 [label=AddmmBackward0]
2263593074896 -> 2263573954272
2263541363440 [label="mlp_extractor.value_net.2.bias
(64)" fillcolor=lightblue]
2263541363440 -> 2263593074896
2263593074896 [label=AccumulateGrad]
2263593075808 -> 2263573954272
2263593075808 [label=TanhBackward0]
2263593074992 -> 2263593075808
// First value-side Addmm: mlp_extractor.value_net.0 (bias 64, weight 64x25).
// Only the bias and the transposed weight appear as inputs; no node for the
// input data is present in this graph.
2263593074992 [label=AddmmBackward0]
2263593075184 -> 2263593074992
2263541363280 [label="mlp_extractor.value_net.0.bias
(64)" fillcolor=lightblue]
2263541363280 -> 2263593075184
2263593075184 [label=AccumulateGrad]
2263593075088 -> 2263593074992
2263593075088 [label=TBackward0]
2263593075280 -> 2263593075088
2263541363200 [label="mlp_extractor.value_net.0.weight
(64, 25)" fillcolor=lightblue]
2263541363200 -> 2263593075280
2263593075280 [label=AccumulateGrad]
2263593075952 -> 2263573954272
2263593075952 [label=TBackward0]
2263593075232 -> 2263593075952
2263541363360 [label="mlp_extractor.value_net.2.weight
(64, 64)" fillcolor=lightblue]
2263541363360 -> 2263593075232
2263593075232 [label=AccumulateGrad]
2263589926512 -> 2263578566400
2263589926512 [label=TBackward0]
2263593075136 -> 2263589926512
2263541364640 [label="value_net.weight
(1, 64)" fillcolor=lightblue]
2263541364640 -> 2263593075136
2263593075136 [label=AccumulateGrad]
// Final edge of the value branch: top-level Addmm -> (1, 1) result.
2263578566400 -> 2263581907360
// ---- Result node with shape (1): policy branch --------------------------
// Chain into the result: Addmm (action_net) -> SplitWithSizes ->
// two parallel Sub/Logsumexp -> Gather -> Squeeze chains -> Stack -> Sum.
// NOTE(review): this pattern looks like summed log-probabilities over two
// categorical sub-actions — confirm against the model code.
2263593173632 [label="
(1)" fillcolor=darkolivegreen1]
2263573748496 [label=SumBackward1]
2263587832448 -> 2263573748496
2263587832448 [label=StackBackward0]
// First of the two chains feeding StackBackward0.
2263593074944 -> 2263587832448
2263593074944 [label=SqueezeBackward1]
2263593075472 -> 2263593074944
2263593075472 [label=GatherBackward0]
2263593075568 -> 2263593075472
2263593075568 [label=SubBackward0]
2263593075712 -> 2263593075568
// Shared split node: it feeds both SubBackward0 nodes and both
// LogsumexpBackward0 nodes declared further down.
2263593075712 [label=SplitWithSizesBackward0]
2263593075664 -> 2263593075712
// Policy output Addmm: action_net (bias 10, weight 10x64).
2263593075664 [label=AddmmBackward0]
2263593076576 -> 2263593075664
2263541364560 [label="action_net.bias
(10)" fillcolor=lightblue]
2263541364560 -> 2263593076576
2263593076576 [label=AccumulateGrad]
2263593076288 -> 2263593075664
2263593076288 [label=TanhBackward0]
2263593076864 -> 2263593076288
// Second policy-side Addmm: mlp_extractor.policy_net.2 (bias 64, weight 64x64).
2263593076864 [label=AddmmBackward0]
2263593076960 -> 2263593076864
2263541363120 [label="mlp_extractor.policy_net.2.bias
(64)" fillcolor=lightblue]
2263541363120 -> 2263593076960
2263593076960 [label=AccumulateGrad]
2263593076912 -> 2263593076864
2263593076912 [label=TanhBackward0]
2263593077536 -> 2263593076912
// First policy-side Addmm: mlp_extractor.policy_net.0 (bias 64, weight 64x25).
2263593077536 [label=AddmmBackward0]
2263593077680 -> 2263593077536
2263541362880 [label="mlp_extractor.policy_net.0.bias
(64)" fillcolor=lightblue]
2263541362880 -> 2263593077680
2263593077680 [label=AccumulateGrad]
2263593077632 -> 2263593077536
2263593077632 [label=TBackward0]
2263593077776 -> 2263593077632
2263541362800 [label="mlp_extractor.policy_net.0.weight
(64, 25)" fillcolor=lightblue]
2263541362800 -> 2263593077776
2263593077776 [label=AccumulateGrad]
2263593077152 -> 2263593076864
2263593077152 [label=TBackward0]
2263593077728 -> 2263593077152
2263541363040 [label="mlp_extractor.policy_net.2.weight
(64, 64)" fillcolor=lightblue]
2263541363040 -> 2263593077728
2263593077728 [label=AccumulateGrad]
2263593075760 -> 2263593075664
2263593075760 [label=TBackward0]
2263593077584 -> 2263593075760
2263541364480 [label="action_net.weight
(10, 64)" fillcolor=lightblue]
2263541364480 -> 2263593077584
2263593077584 [label=AccumulateGrad]
// Second operand of the first SubBackward0: Logsumexp of the split output.
2263593075616 -> 2263593075568
2263593075616 [label=LogsumexpBackward0]
2263593075712 -> 2263593075616
// Second chain feeding StackBackward0; same shape as the first and reading
// from the same SplitWithSizesBackward0 node.
2263593075328 -> 2263587832448
2263593075328 [label=SqueezeBackward1]
2263593075424 -> 2263593075328
2263593075424 [label=GatherBackward0]
2263593076336 -> 2263593075424
2263593076336 [label=SubBackward0]
2263593075712 -> 2263593076336
2263593077488 -> 2263593076336
2263593077488 [label=LogsumexpBackward0]
2263593075712 -> 2263593077488
// Final edge of the policy branch: SumBackward1 -> (1) result.
2263573748496 -> 2263593173632
}