1111
1212
1313def add_all_arguments (parser ):
14- # path / directory
14+
1515 parser .add_argument (
16- "--result_dir" , default = "./runs" , help = "The directory to save checkpoints and logs (default: %(default)s)"
16+ "-h" ,
17+ "--help" ,
18+ action = "help" ,
19+ help = "Quickstart: https://www.csie.ntu.edu.tw/~cjlin/libmultilabel/cli/quickstart.html" ,
1720 )
1821
22+ parser .add_argument ("--seed" , type = int , help = "Random seed (default: %(default)s)" )
23+
24+ # choose model (linear / nn)
25+ parser .add_argument ("--linear" , action = "store_true" , help = "Train linear model" )
26+
27+ # others
28+ parser .add_argument ("--cpu" , action = "store_true" , help = "Disable CUDA" )
29+ parser .add_argument ("--silent" , action = "store_true" , help = "Enable silent mode" )
30+ parser .add_argument (
31+ "--data_workers" , type = int , default = 4 , help = "Use multi-cpu core for data pre-processing (default: %(default)s)"
32+ )
33+ parser .add_argument (
34+ "--embed_cache_dir" ,
35+ type = str ,
36+ help = "For parameter search only: path to a directory for storing embeddings for multiple runs. (default: %(default)s)" ,
37+ )
38+ parser .add_argument (
39+ "--eval" , action = "store_true" , help = "Only run evaluation on the test set (default: %(default)s)"
40+ )
41+ parser .add_argument ("--checkpoint_path" , help = "The checkpoint to warm-up with (default: %(default)s)" )
42+
1943 # data
20- parser .add_argument ("--data_name" , default = "unnamed_data" , help = "Dataset name (default: %(default)s)" )
44+ parser .add_argument (
45+ "--data_name" ,
46+ default = "unnamed_data" ,
47+ help = "Dataset name for generating the output directory (default: %(default)s)" ,
48+ )
2149 parser .add_argument ("--training_file" , help = "Path to training data (default: %(default)s)" )
2250 parser .add_argument ("--val_file" , help = "Path to validation data (default: %(default)s)" )
23- parser .add_argument ("--test_file" , help = "Path to test data (default: %(default)s" )
51+ parser .add_argument ("--test_file" , help = "Path to test data (default: %(default)s)" )
52+ parser .add_argument ("--label_file" , type = str , help = "Path to a file holding all labels (default: %(default)s)" )
2453 parser .add_argument (
2554 "--val_size" ,
2655 type = float ,
2756 default = 0.2 ,
28- help = "Training-validation split: a ratio in [0, 1] or an integer for the size of the validation set (default: %(default)s). " ,
57+ help = "Training-validation split: a ratio in [0, 1] or an integer for the size of the validation set (default: %(default)s)" ,
2958 )
3059 parser .add_argument (
3160 "--min_vocab_freq" ,
@@ -67,8 +96,24 @@ def add_all_arguments(parser):
6796 help = "Whether to add the special tokens for inputs of the transformer-based language model. (default: %(default)s)" ,
6897 )
6998
99+ # model
100+ parser .add_argument ("--model_name" , default = "unnamed_model" , help = "Model to be used (default: %(default)s)" )
101+ parser .add_argument (
102+ "--init_weight" , default = "kaiming_uniform" , help = "Weight initialization to be used (default: %(default)s)"
103+ )
104+ parser .add_argument (
105+ "--loss_function" , default = "binary_cross_entropy_with_logits" , help = "Loss function (default: %(default)s)"
106+ )
107+
108+ # pretrained vocab / embeddings
109+ parser .add_argument ("--vocab_file" , type = str , help = "Path to a file holding vocabularies (default: %(default)s)" )
110+ parser .add_argument (
111+ "--embed_file" ,
112+ type = str ,
113+ help = "Path to a file holding pre-trained embeddings or the name of the pretrained GloVe embedding (default: %(default)s)" ,
114+ )
115+
70116 # train
71- parser .add_argument ("--seed" , type = int , help = "Random seed (default: %(default)s)" )
72117 parser .add_argument (
73118 "--epochs" , type = int , default = 10000 , help = "The number of epochs to train (default: %(default)s)"
74119 )
@@ -109,15 +154,6 @@ def add_all_arguments(parser):
109154 help = "Whether the embeddings of each word is normalized to a unit vector (default: %(default)s)" ,
110155 )
111156
112- # model
113- parser .add_argument ("--model_name" , default = "unnamed_model" , help = "Model to be used (default: %(default)s)" )
114- parser .add_argument (
115- "--init_weight" , default = "kaiming_uniform" , help = "Weight initialization to be used (default: %(default)s)"
116- )
117- parser .add_argument (
118- "--loss_function" , default = "binary_cross_entropy_with_logits" , help = "Loss function (default: %(default)s)"
119- )
120-
121157 # eval
122158 parser .add_argument (
123159 "--eval_batch_size" , type = int , default = 256 , help = "Size of evaluating batches (default: %(default)s)"
@@ -138,28 +174,6 @@ def add_all_arguments(parser):
138174 "--val_metric" , default = "P@1" , help = "The metric to select the best model for testing (default: %(default)s)"
139175 )
140176
141- # pretrained vocab / embeddings
142- parser .add_argument ("--vocab_file" , type = str , help = "Path to a file holding vocabuaries (default: %(default)s)" )
143- parser .add_argument (
144- "--embed_file" , type = str , help = "Path to a file holding pre-trained embeddings or the name of the pretrained GloVe embedding (default: %(default)s)"
145- )
146- parser .add_argument ("--label_file" , type = str , help = "Path to a file holding all labels (default: %(default)s)" )
147-
148- # log
149- parser .add_argument (
150- "--save_k_predictions" ,
151- type = int ,
152- nargs = "?" ,
153- const = 100 ,
154- default = 0 ,
155- help = "Save top k predictions on test set. k=%(const)s if not specified. (default: %(default)s)" ,
156- )
157- parser .add_argument (
158- "--predict_out_path" ,
159- default = "./predictions.txt" ,
160- help = "Path to the output file holding label results (default: %(default)s)" ,
161- )
162-
163177 # auto-test
164178 parser .add_argument (
165179 "--limit_train_batches" ,
@@ -180,24 +194,27 @@ def add_all_arguments(parser):
180194 help = "Percentage of test dataset to use for auto-testing (default: %(default)s)" ,
181195 )
182196
183- # others
184- parser .add_argument ("--cpu" , action = "store_true" , help = "Disable CUDA" )
185- parser .add_argument ("--silent" , action = "store_true" , help = "Enable silent mode" )
197+ # log
186198 parser .add_argument (
187- "--data_workers" , type = int , default = 4 , help = "Use multi-cpu core for data pre-processing (default: %(default)s)"
199+ "--save_k_predictions" ,
200+ type = int ,
201+ nargs = "?" ,
202+ const = 100 ,
203+ default = 0 ,
204+ help = "Save top k predictions on test set. k=%(const)s if not specified. (default: %(default)s)" ,
188205 )
189206 parser .add_argument (
190- "--embed_cache_dir " ,
191- type = str ,
192- help = "For parameter search only: path to a directory for storing embeddings for multiple runs. (default: %(default)s)" ,
207+ "--predict_out_path " ,
208+ default = "./predictions.txt" ,
209+ help = "Path to the output file holding label results (default: %(default)s)" ,
193210 )
211+
212+ # path / directory
194213 parser .add_argument (
195- "--eval " , action = "store_true " , help = "Only run evaluation on the test set (default: %(default)s)"
214+ "--result_dir " , default = "./runs " , help = "The directory to save checkpoints and logs (default: %(default)s)"
196215 )
197- parser .add_argument ("--checkpoint_path" , help = "The checkpoint to warm-up with (default: %(default)s)" )
198216
199217 # linear options
200- parser .add_argument ("--linear" , action = "store_true" , help = "Train linear model" )
201218 parser .add_argument (
202219 "--data_format" ,
203220 type = str ,
@@ -224,7 +241,10 @@ def add_all_arguments(parser):
224241 "--tree_max_depth" , type = int , default = 10 , help = "Maximum depth of the tree (default: %(default)s)"
225242 )
226243 parser .add_argument (
227- "--tree_ensemble_models" , type = int , default = 1 , help = "Number of models in the tree ensemble (default: %(default)s)"
244+ "--tree_ensemble_models" ,
245+ type = int ,
246+ default = 1 ,
247+ help = "Number of models in the tree ensemble (default: %(default)s)" ,
228248 )
229249 parser .add_argument (
230250 "--beam_width" ,
@@ -239,13 +259,6 @@ def add_all_arguments(parser):
239259 default = 8 ,
240260 help = "the maximal number of labels inside a cluster (default: %(default)s)" ,
241261 )
242- parser .add_argument (
243- "-h" ,
244- "--help" ,
245- action = "help" ,
246- help = "If you are trying to specify network config such as dropout or activation or config of the learning rate scheduler, use a yaml file instead. "
247- "See example configs in example_config" ,
248- )
249262
250263
251264def get_config ():
0 commit comments