-
Notifications
You must be signed in to change notification settings - Fork 8
/
args.py
172 lines (159 loc) · 5.31 KB
/
args.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
import argparse
import os
import pathlib
from simple_einet.dist import Dist
def parse_args():
home = os.getenv("HOME")
data_dir = os.getenv("DATA_DIR", os.path.join(home, "data"))
results_dir = os.getenv("RESULTS_DIR", os.path.join(home, "results"))
parser = argparse.ArgumentParser(description="PyTorch MNIST Example")
parser.add_argument(
"--dataset",
required=True,
help="Dataset to use for training.",
)
# Flag if model should be trained
parser.add_argument(
"--train",
action="store_true",
help="Flag if model should be trained.",
)
parser.add_argument("--data-dir", default=data_dir, help="path to dataset")
parser.add_argument("--results-dir", default=results_dir, help="path to results")
parser.add_argument(
"--mixture",
default=1,
type=int,
help="Number of mixture components for an EinetMixture model (if 1 then only an Einet model is used).",
)
parser.add_argument(
"--lr",
type=float,
default=0.1,
help="Learning rate",
)
parser.add_argument(
"--batch-size",
type=int,
default=64,
metavar="N",
help="input batch size for training (default: 64)",
)
parser.add_argument(
"--n-bits",
type=int,
default=8,
metavar="N",
help="number of bits for each pixel (default: 8)",
)
parser.add_argument("--num-workers", type=int, help="number of data loading workers", default=4)
parser.add_argument(
"--epochs",
type=int,
default=14,
metavar="N",
help="number of epochs to train (default: 14)",
)
parser.add_argument(
"--temperature-leaves",
type=float,
default=1.0,
help="Temperature for leave variance during sampling.",
)
parser.add_argument(
"--temperature-sums",
type=float,
default=1.0,
help="Temperature for sum weights during sampling.",
)
parser.add_argument(
"--dropout",
type=float,
default=0.0,
help="Dropout probability.",
)
parser.add_argument(
"--min-sigma",
type=float,
default=1e-2,
help="Normal distribution min sigma value.",
)
parser.add_argument(
"--max-sigma",
type=float,
default=2.0,
help="Normal distribution min sigma value.",
)
parser.add_argument(
"--dry-run",
action="store_true",
default=False,
help="quickly check a single pass",
)
parser.add_argument("--seed", type=int, default=1, metavar="S", help="random seed (default: 1)")
parser.add_argument(
"--log-interval",
type=int,
default=10,
metavar="N",
help="how many batches to wait before logging training status",
)
parser.add_argument(
"--classification",
action="store_true",
default=False,
help="Flag for learning a discriminative task of classifying MNIST digits.",
)
parser.add_argument(
"--device",
default="cuda",
help="Device flag. Can be either 'cpu' or 'cuda'.",
)
parser.add_argument(
"--debug",
action="store_true",
help="Debug flag (less data, fewer iterations)",
)
parser.add_argument("-S", type=int, default=10, help="Number of output sum nodes in each layer.")
parser.add_argument("-I", type=int, default=10, help="Number of distributions for each RV.")
parser.add_argument("-D", type=int, default=3)
parser.add_argument("-R", type=int, default=1)
parser.add_argument("--gpu", help="GPU device id.")
parser.add_argument(
"--load-and-eval",
default=None,
type=pathlib.Path,
help="path to a result directory with a "
"model and stored args. if set, "
"training is skipped and model is "
"evaluated",
)
parser.add_argument("--layer", choices=["einsum", "linsum"], default="linsum", help="layer type")
parser.add_argument(
"--dist",
type=Dist,
choices=list(Dist),
default=Dist.BINOMIAL,
help="data distribution",
)
parser.add_argument(
"--precision",
"-p",
default=32,
help="floating point precision [16, " "bf16, 32]",
choices=["16", "bf16", "32"],
)
parser.add_argument("--group-tag", type=str, help="tag for group of experiments")
parser.add_argument("--tag", type=str, help="tag for experiment")
parser.add_argument("--wandb", action="store_true", help="enable wandb online logging")
parser.add_argument("--swa", action="store_true", help="use Stochastic Weight Averaging")
parser.add_argument("--profiler", help="", choices=["simple", "pytorch", "advanced"])
parser.add_argument("--log-weights", action="store_true", help="use log weights")
parser.add_argument("--num-devices", type=int, default=1, help="number of devices")
parser.add_argument("--structure", default="top-down", choices=["bottom-up", "top-down"], help="structure of the network")
# Parse args
args = parser.parse_args()
# If FP16/FP32 is given, convert to int (else it's "bf16", keep string)
if args.precision == "16" or args.precision == "32":
args.precision = int(args.precision)
return args