-
Notifications
You must be signed in to change notification settings - Fork 46
/
Copy pathpreprocess.py
611 lines (593 loc) · 48.9 KB
/
preprocess.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
import os
import argparse
from multiprocessing import cpu_count
from utils.convert_csqa import convert_to_entailment
from utils.convert_scitail import convert_to_scitail_statement
from utils.convert_phys import convert_to_phys_statement
from utils.convert_socialiqa import convert_to_socialiqa_statement
from utils.convert_obqa import convert_to_obqa_statement
from utils.tokenization_utils import tokenize_statement_file, make_word_vocab
from utils.conceptnet import extract_english, construct_graph
from utils.embedding import glove2npy, load_pretrained_embeddings
from utils.grounding import create_matcher_patterns, ground
from utils.paths import find_paths, score_paths, prune_paths, find_relational_paths_from_paths, generate_path_and_graph_from_adj
from utils.graph import generate_graph, generate_adj_data_from_grounded_concepts, coo_to_normalized
from utils.triples import generate_triples_from_adj
input_paths = {
'csqa': {
'train': './data/csqa/train_rand_split.jsonl',
'dev': './data/csqa/dev_rand_split.jsonl',
'test': './data/csqa/test_rand_split_no_answers.jsonl',
},
'scitail': {
'train': './data/scitail/SciTailV1.1/predictor_format/scitail_1.0_structure_train.jsonl',
'dev': './data/scitail/SciTailV1.1/predictor_format/scitail_1.0_structure_dev.jsonl',
'test': './data/scitail/SciTailV1.1/predictor_format/scitail_1.0_structure_test.jsonl',
},
'phys': {
'train': './data/phys/physicaliqa-train-dev/train.jsonl',
'dev': './data/phys/physicaliqa-train-dev/dev.jsonl',
'train-label': './data/phys/physicaliqa-train-dev/train-labels.lst',
'dev-label': './data/phys/physicaliqa-train-dev/dev-labels.lst',
},
'socialiqa': {
'train': './data/socialiqa/socialiqa-train-dev/train.jsonl',
'dev': './data/socialiqa/socialiqa-train-dev/dev.jsonl',
'train-label': './data/socialiqa/socialiqa-train-dev/train-labels.lst',
'dev-label': './data/socialiqa/socialiqa-train-dev/dev-labels.lst',
},
'obqa': {
'train': './data/obqa/OpenBookQA-V1-Sep2018/Data/Main/train.jsonl',
'dev': './data/obqa/OpenBookQA-V1-Sep2018/Data/Main/dev.jsonl',
'test': './data/obqa/OpenBookQA-V1-Sep2018/Data/Main/test.jsonl',
},
'cpnet': {
'csv': './data/cpnet/conceptnet-assertions-5.6.0.csv',
},
'glove': {
'txt': './data/glove/glove.6B.300d.txt',
},
'numberbatch': {
'txt': './data/transe/numberbatch-en-19.08.txt',
},
'transe': {
'ent': './data/transe/glove.transe.sgd.ent.npy',
'rel': './data/transe/glove.transe.sgd.rel.npy',
},
}
output_paths = {
'cpnet': {
'csv': './data/cpnet/conceptnet.en.csv',
'vocab': './data/cpnet/concept.txt',
'patterns': './data/cpnet/matcher_patterns.json',
'unpruned-graph': './data/cpnet/conceptnet.en.unpruned.graph',
'pruned-graph': './data/cpnet/conceptnet.en.pruned.graph',
},
'glove': {
'npy': './data/glove/glove.6B.300d.npy',
'vocab': './data/glove/glove.vocab',
},
'numberbatch': {
'npy': './data/transe/nb.npy',
'vocab': './data/transe/nb.vocab',
'concept_npy': './data/transe/concept.nb.npy'
},
'csqa': {
'statement': {
'train': './data/csqa/statement/train.statement.jsonl',
'dev': './data/csqa/statement/dev.statement.jsonl',
'test': './data/csqa/statement/test.statement.jsonl',
'vocab': './data/csqa/statement/vocab.json',
},
'statement-with-ans-pos': {
'train': './data/csqa/statement/train.statement-with-ans-pos.jsonl',
'dev': './data/csqa/statement/dev.statement-with-ans-pos.jsonl',
'test': './data/csqa/statement/test.statement-with-ans-pos.jsonl',
},
'tokenized': {
'train': './data/csqa/tokenized/train.tokenized.txt',
'dev': './data/csqa/tokenized/dev.tokenized.txt',
'test': './data/csqa/tokenized/test.tokenized.txt',
},
'grounded': {
'train': './data/csqa/grounded/train.grounded.jsonl',
'dev': './data/csqa/grounded/dev.grounded.jsonl',
'test': './data/csqa/grounded/test.grounded.jsonl',
},
'paths': {
'raw-train': './data/csqa/paths/train.paths.raw.jsonl',
'raw-dev': './data/csqa/paths/dev.paths.raw.jsonl',
'raw-test': './data/csqa/paths/test.paths.raw.jsonl',
'scores-train': './data/csqa/paths/train.paths.scores.jsonl',
'scores-dev': './data/csqa/paths/dev.paths.scores.jsonl',
'scores-test': './data/csqa/paths/test.paths.scores.jsonl',
'pruned-train': './data/csqa/paths/train.paths.pruned.jsonl',
'pruned-dev': './data/csqa/paths/dev.paths.pruned.jsonl',
'pruned-test': './data/csqa/paths/test.paths.pruned.jsonl',
'adj-train': './data/csqa/paths/train.paths.adj.jsonl',
'adj-dev': './data/csqa/paths/dev.paths.adj.jsonl',
'adj-test': './data/csqa/paths/test.paths.adj.jsonl',
},
'graph': {
'train': './data/csqa/graph/train.graph.jsonl',
'dev': './data/csqa/graph/dev.graph.jsonl',
'test': './data/csqa/graph/test.graph.jsonl',
'adj-train': './data/csqa/graph/train.graph.adj.pk',
'adj-dev': './data/csqa/graph/dev.graph.adj.pk',
'adj-test': './data/csqa/graph/test.graph.adj.pk',
'nxg-from-adj-train': './data/csqa/graph/train.graph.adj.jsonl',
'nxg-from-adj-dev': './data/csqa/graph/dev.graph.adj.jsonl',
'nxg-from-adj-test': './data/csqa/graph/test.graph.adj.jsonl',
},
'triple': {
'train': './data/csqa/triples/train.triples.pk',
'dev': './data/csqa/triples/dev.triples.pk',
'test': './data/csqa/triples/test.triples.pk',
},
},
'scitail': {
'statement': {
'train': './data/scitail/statement/train.statement.jsonl',
'dev': './data/scitail/statement/dev.statement.jsonl',
'test': './data/scitail/statement/test.statement.jsonl',
'train-fairseq': './data/scitail/fairseq/official/train.jsonl',
'dev-fairseq': './data/scitail/fairseq/official/valid.jsonl',
'test-fairseq': './data/scitail/fairseq/official/test.jsonl',
'vocab': './data/scitail/statement/vocab.json',
},
'tokenized': {
'train': './data/scitail/tokenized/train.tokenized.txt',
'dev': './data/scitail/tokenized/dev.tokenized.txt',
'test': './data/scitail/tokenized/test.tokenized.txt',
},
'grounded': {
'train': './data/scitail/grounded/train.grounded.jsonl',
'dev': './data/scitail/grounded/dev.grounded.jsonl',
'test': './data/scitail/grounded/test.grounded.jsonl',
},
'paths': {
'raw-train': './data/scitail/paths/train.paths.raw.jsonl',
'raw-dev': './data/scitail/paths/dev.paths.raw.jsonl',
'raw-test': './data/scitail/paths/test.paths.raw.jsonl',
'scores-train': './data/scitail/paths/train.paths.scores.jsonl',
'scores-dev': './data/scitail/paths/dev.paths.scores.jsonl',
'scores-test': './data/scitail/paths/test.paths.scores.jsonl',
'pruned-train': './data/scitail/paths/train.paths.pruned.jsonl',
'pruned-dev': './data/scitail/paths/dev.paths.pruned.jsonl',
'pruned-test': './data/scitail/paths/test.paths.pruned.jsonl',
},
'graph': {
'train': './data/scitail/graph/train.graph.jsonl',
'dev': './data/scitail/graph/dev.graph.jsonl',
'test': './data/scitail/graph/test.graph.jsonl',
'adj-train': './data/scitail/graph/train.graph.adj.pk',
'adj-dev': './data/scitail/graph/dev.graph.adj.pk',
'adj-test': './data/scitail/graph/test.graph.adj.pk',
},
'triple': {
'train': './data/scitail/triples/train.triples.pk',
'dev': './data/scitail/triples/dev.triples.pk',
'test': './data/scitail/triples/test.triples.pk',
},
},
'phys': {
'statement': {
'train': './data/phys/statement/train.statement.jsonl',
'dev': './data/phys/statement/dev.statement.jsonl',
'train-fairseq': './data/phys/fairseq/official/train.jsonl',
'dev-fairseq': './data/phys/fairseq/official/valid.jsonl',
'vocab': './data/phys/statement/vocab.json',
},
'tokenized': {
'train': './data/phys/tokenized/train.tokenized.txt',
'dev': './data/phys/tokenized/dev.tokenized.txt',
},
'grounded': {
'train': './data/phys/grounded/train.grounded.jsonl',
'dev': './data/phys/grounded/dev.grounded.jsonl',
},
'paths': {
'raw-train': './data/phys/paths/train.paths.raw.jsonl',
'raw-dev': './data/phys/paths/dev.paths.raw.jsonl',
'scores-train': './data/phys/paths/train.paths.scores.jsonl',
'scores-dev': './data/phys/paths/dev.paths.scores.jsonl',
'pruned-train': './data/phys/paths/train.paths.pruned.jsonl',
'pruned-dev': './data/phys/paths/dev.paths.pruned.jsonl',
},
'graph': {
'train': './data/phys/graph/train.graph.jsonl',
'dev': './data/phys/graph/dev.graph.jsonl',
'adj-train': './data/phys/graph/train.graph.adj.pk',
'adj-dev': './data/phys/graph/dev.graph.adj.pk',
},
'triple': {
'train': './data/phys/triples/train.triples.pk',
'dev': './data/phys/triples/dev.triples.pk',
'test': './data/phys/triples/test.triples.pk',
},
},
'socialiqa': {
'statement': {
'train': './data/socialiqa/statement/train.statement.jsonl',
'dev': './data/socialiqa/statement/dev.statement.jsonl',
'train-fairseq': './data/socialiqa/fairseq/official/train.jsonl',
'dev-fairseq': './data/socialiqa/fairseq/official/valid.jsonl',
'vocab': './data/socialiqa/statement/vocab.json',
},
'tokenized': {
'train': './data/socialiqa/tokenized/train.tokenized.txt',
'dev': './data/socialiqa/tokenized/dev.tokenized.txt',
},
'grounded': {
'train': './data/socialiqa/grounded/train.grounded.jsonl',
'dev': './data/socialiqa/grounded/dev.grounded.jsonl',
},
'paths': {
'raw-train': './data/socialiqa/paths/train.paths.raw.jsonl',
'raw-dev': './data/socialiqa/paths/dev.paths.raw.jsonl',
'scores-train': './data/socialiqa/paths/train.paths.scores.jsonl',
'scores-dev': './data/socialiqa/paths/dev.paths.scores.jsonl',
'pruned-train': './data/socialiqa/paths/train.paths.pruned.jsonl',
'pruned-dev': './data/socialiqa/paths/dev.paths.pruned.jsonl',
'adj-train': './data/socialiqa/paths/train.paths.adj.jsonl',
'adj-dev': './data/socialiqa/paths/dev.paths.adj.jsonl',
'adj-test': './data/socialiqa/paths/test.paths.adj.jsonl',
},
'graph': {
'train': './data/socialiqa/graph/train.graph.jsonl',
'dev': './data/socialiqa/graph/dev.graph.jsonl',
'adj-train': './data/socialiqa/graph/train.graph.adj.pk',
'adj-dev': './data/socialiqa/graph/dev.graph.adj.pk',
'nxg-from-adj-train': './data/socialiqa/graph/train.graph.adj.jsonl',
'nxg-from-adj-dev': './data/socialiqa/graph/dev.graph.adj.jsonl',
},
'triple': {
'train': './data/socialiqa/triples/train.triples.pk',
'dev': './data/socialiqa/triples/dev.triples.pk',
'test': './data/socialiqa/triples/test.triples.pk',
},
},
'obqa': {
'statement': {
'train': './data/obqa/statement/train.statement.jsonl',
'dev': './data/obqa/statement/dev.statement.jsonl',
'test': './data/obqa/statement/test.statement.jsonl',
'train-fairseq': './data/obqa/fairseq/official/train.jsonl',
'dev-fairseq': './data/obqa/fairseq/official/valid.jsonl',
'test-fairseq': './data/obqa/fairseq/official/test.jsonl',
'vocab': './data/obqa/statement/vocab.json',
},
'tokenized': {
'train': './data/obqa/tokenized/train.tokenized.txt',
'dev': './data/obqa/tokenized/dev.tokenized.txt',
'test': './data/obqa/tokenized/test.tokenized.txt',
},
'grounded': {
'train': './data/obqa/grounded/train.grounded.jsonl',
'dev': './data/obqa/grounded/dev.grounded.jsonl',
'test': './data/obqa/grounded/test.grounded.jsonl',
},
'paths': {
'raw-train': './data/obqa/paths/train.paths.raw.jsonl',
'raw-dev': './data/obqa/paths/dev.paths.raw.jsonl',
'raw-test': './data/obqa/paths/test.paths.raw.jsonl',
'scores-train': './data/obqa/paths/train.paths.scores.jsonl',
'scores-dev': './data/obqa/paths/dev.paths.scores.jsonl',
'scores-test': './data/obqa/paths/test.paths.scores.jsonl',
'pruned-train': './data/obqa/paths/train.paths.pruned.jsonl',
'pruned-dev': './data/obqa/paths/dev.paths.pruned.jsonl',
'pruned-test': './data/obqa/paths/test.paths.pruned.jsonl',
'adj-train': './data/obqa/paths/train.paths.adj.jsonl',
'adj-dev': './data/obqa/paths/dev.paths.adj.jsonl',
'adj-test': './data/obqa/paths/test.paths.adj.jsonl',
},
'graph': {
'train': './data/obqa/graph/train.graph.jsonl',
'dev': './data/obqa/graph/dev.graph.jsonl',
'test': './data/obqa/graph/test.graph.jsonl',
'adj-train': './data/obqa/graph/train.graph.adj.pk',
'adj-dev': './data/obqa/graph/dev.graph.adj.pk',
'adj-test': './data/obqa/graph/test.graph.adj.pk',
'nxg-from-adj-train': './data/obqa/graph/train.graph.adj.jsonl',
'nxg-from-adj-dev': './data/obqa/graph/dev.graph.adj.jsonl',
'nxg-from-adj-test': './data/obqa/graph/test.graph.adj.jsonl',
},
'triple': {
'train': './data/obqa/triples/train.triples.pk',
'dev': './data/obqa/triples/dev.triples.pk',
'test': './data/obqa/triples/test.triples.pk',
},
},
'hswag': {},
'anli': {},
}
def main():
parser = argparse.ArgumentParser()
parser.add_argument('--run', default=['common', 'csqa'], choices=['common', 'csqa', 'hswag', 'anli', 'exp', 'scitail', 'phys', 'socialiqa', 'obqa', 'make_word_vocab'], nargs='+')
parser.add_argument('--path_prune_threshold', type=float, default=0.12, help='threshold for pruning paths')
parser.add_argument('--max_node_num', type=int, default=200, help='maximum number of nodes per graph')
parser.add_argument('-p', '--nprocs', type=int, default=cpu_count(), help='number of processes to use')
parser.add_argument('--seed', type=int, default=0, help='random seed')
parser.add_argument('--debug', action='store_true', help='enable debug mode')
args = parser.parse_args()
if args.debug:
raise NotImplementedError()
routines = {
'common': [
{'func': glove2npy, 'args': (input_paths['glove']['txt'], output_paths['glove']['npy'], output_paths['glove']['vocab'])},
{'func': glove2npy, 'args': (input_paths['numberbatch']['txt'], output_paths['numberbatch']['npy'], output_paths['numberbatch']['vocab'], True)},
{'func': extract_english, 'args': (input_paths['cpnet']['csv'], output_paths['cpnet']['csv'], output_paths['cpnet']['vocab'])},
{'func': load_pretrained_embeddings,
'args': (output_paths['numberbatch']['npy'], output_paths['numberbatch']['vocab'], output_paths['cpnet']['vocab'], False, output_paths['numberbatch']['concept_npy'])},
{'func': construct_graph, 'args': (output_paths['cpnet']['csv'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['unpruned-graph'], False)},
{'func': construct_graph, 'args': (output_paths['cpnet']['csv'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], True)},
{'func': create_matcher_patterns, 'args': (output_paths['cpnet']['vocab'], output_paths['cpnet']['patterns'])},
],
'csqa': [
{'func': convert_to_entailment, 'args': (input_paths['csqa']['train'], output_paths['csqa']['statement']['train'])},
{'func': convert_to_entailment, 'args': (input_paths['csqa']['dev'], output_paths['csqa']['statement']['dev'])},
{'func': convert_to_entailment, 'args': (input_paths['csqa']['test'], output_paths['csqa']['statement']['test'])},
{'func': tokenize_statement_file, 'args': (output_paths['csqa']['statement']['train'], output_paths['csqa']['tokenized']['train'])},
{'func': tokenize_statement_file, 'args': (output_paths['csqa']['statement']['dev'], output_paths['csqa']['tokenized']['dev'])},
{'func': tokenize_statement_file, 'args': (output_paths['csqa']['statement']['test'], output_paths['csqa']['tokenized']['test'])},
{'func': make_word_vocab, 'args': ((output_paths['csqa']['statement']['train'],), output_paths['csqa']['statement']['vocab'])},
{'func': ground, 'args': (output_paths['csqa']['statement']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['csqa']['grounded']['train'], args.nprocs)},
{'func': ground, 'args': (output_paths['csqa']['statement']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['csqa']['grounded']['dev'], args.nprocs)},
{'func': ground, 'args': (output_paths['csqa']['statement']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['csqa']['grounded']['test'], args.nprocs)},
{'func': find_paths, 'args': (output_paths['csqa']['grounded']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['raw-train'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['csqa']['grounded']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['raw-dev'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['csqa']['grounded']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['raw-test'], args.nprocs, args.seed)},
{'func': score_paths, 'args': (output_paths['csqa']['paths']['raw-train'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['csqa']['paths']['scores-train'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['csqa']['paths']['raw-dev'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['csqa']['paths']['scores-dev'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['csqa']['paths']['raw-test'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['csqa']['paths']['scores-test'], args.nprocs)},
{'func': prune_paths, 'args': (output_paths['csqa']['paths']['raw-train'], output_paths['csqa']['paths']['scores-train'],
output_paths['csqa']['paths']['pruned-train'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['csqa']['paths']['raw-dev'], output_paths['csqa']['paths']['scores-dev'],
output_paths['csqa']['paths']['pruned-dev'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['csqa']['paths']['raw-test'], output_paths['csqa']['paths']['scores-test'],
output_paths['csqa']['paths']['pruned-test'], args.path_prune_threshold)},
{'func': generate_graph, 'args': (output_paths['csqa']['grounded']['train'], output_paths['csqa']['paths']['pruned-train'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['csqa']['graph']['train'])},
{'func': generate_graph, 'args': (output_paths['csqa']['grounded']['dev'], output_paths['csqa']['paths']['pruned-dev'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['csqa']['graph']['dev'])},
{'func': generate_graph, 'args': (output_paths['csqa']['grounded']['test'], output_paths['csqa']['paths']['pruned-test'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['csqa']['graph']['test'])},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['csqa']['grounded']['train'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['csqa']['graph']['adj-train'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['csqa']['grounded']['dev'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['csqa']['graph']['adj-dev'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['csqa']['grounded']['test'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['csqa']['graph']['adj-test'], args.nprocs)},
{'func': generate_triples_from_adj, 'args': (output_paths['csqa']['graph']['adj-train'], output_paths['csqa']['grounded']['train'],
output_paths['cpnet']['vocab'], output_paths['csqa']['triple']['train'])},
{'func': generate_triples_from_adj, 'args': (output_paths['csqa']['graph']['adj-dev'], output_paths['csqa']['grounded']['dev'],
output_paths['cpnet']['vocab'], output_paths['csqa']['triple']['dev'])},
{'func': generate_triples_from_adj, 'args': (output_paths['csqa']['graph']['adj-test'], output_paths['csqa']['grounded']['test'],
output_paths['cpnet']['vocab'], output_paths['csqa']['triple']['test'])},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['csqa']['graph']['adj-train'], output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['adj-train'], output_paths['csqa']['graph']['nxg-from-adj-train'], args.nprocs)},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['csqa']['graph']['adj-dev'], output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['adj-dev'], output_paths['csqa']['graph']['nxg-from-adj-dev'], args.nprocs)},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['csqa']['graph']['adj-test'], output_paths['cpnet']['pruned-graph'], output_paths['csqa']['paths']['adj-test'], output_paths['csqa']['graph']['nxg-from-adj-test'], args.nprocs)},
],
'scitail': [
{'func': convert_to_scitail_statement, 'args': (input_paths['scitail']['train'], output_paths['scitail']['statement']['train'])},
{'func': convert_to_scitail_statement, 'args': (input_paths['scitail']['dev'], output_paths['scitail']['statement']['dev'])},
{'func': convert_to_scitail_statement, 'args': (input_paths['scitail']['test'], output_paths['scitail']['statement']['test'])},
{'func': tokenize_statement_file, 'args': (output_paths['scitail']['statement']['train'], output_paths['scitail']['tokenized']['train'])},
{'func': tokenize_statement_file, 'args': (output_paths['scitail']['statement']['dev'], output_paths['scitail']['tokenized']['dev'])},
{'func': tokenize_statement_file, 'args': (output_paths['scitail']['statement']['test'], output_paths['scitail']['tokenized']['test'])},
{'func': make_word_vocab, 'args': ((output_paths['scitail']['statement']['train'],), output_paths['scitail']['statement']['vocab'])},
{'func': ground, 'args': (output_paths['scitail']['statement']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['scitail']['grounded']['train'], args.nprocs)},
{'func': ground, 'args': (output_paths['scitail']['statement']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['scitail']['grounded']['dev'], args.nprocs)},
{'func': ground, 'args': (output_paths['scitail']['statement']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['scitail']['grounded']['test'], args.nprocs)},
{'func': find_paths, 'args': (output_paths['scitail']['grounded']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['scitail']['paths']['raw-train'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['scitail']['grounded']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['scitail']['paths']['raw-dev'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['scitail']['grounded']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['scitail']['paths']['raw-test'], args.nprocs, args.seed)},
{'func': score_paths, 'args': (output_paths['scitail']['paths']['raw-train'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['scitail']['paths']['scores-train'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['scitail']['paths']['raw-dev'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['scitail']['paths']['scores-dev'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['scitail']['paths']['raw-test'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['scitail']['paths']['scores-test'], args.nprocs)},
{'func': prune_paths, 'args': (output_paths['scitail']['paths']['raw-train'], output_paths['scitail']['paths']['scores-train'],
output_paths['scitail']['paths']['pruned-train'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['scitail']['paths']['raw-dev'], output_paths['scitail']['paths']['scores-dev'],
output_paths['scitail']['paths']['pruned-dev'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['scitail']['paths']['raw-test'], output_paths['scitail']['paths']['scores-test'],
output_paths['scitail']['paths']['pruned-test'], args.path_prune_threshold)},
{'func': generate_graph, 'args': (output_paths['scitail']['grounded']['train'], output_paths['scitail']['paths']['pruned-train'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['scitail']['graph']['train'])},
{'func': generate_graph, 'args': (output_paths['scitail']['grounded']['dev'], output_paths['scitail']['paths']['pruned-dev'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['scitail']['graph']['dev'])},
{'func': generate_graph, 'args': (output_paths['scitail']['grounded']['test'], output_paths['scitail']['paths']['pruned-test'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['scitail']['graph']['test'])},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['scitail']['grounded']['train'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['scitail']['graph']['adj-train'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['scitail']['grounded']['dev'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['scitail']['graph']['adj-dev'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['scitail']['grounded']['test'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['scitail']['graph']['adj-test'], args.nprocs)},
],
'phys': [
{'func': convert_to_phys_statement,
'args': (input_paths['phys']['train'], input_paths['phys']['train-label'], output_paths['phys']['statement']['train'], output_paths['phys']['statement']['train-fairseq'])},
{'func': convert_to_phys_statement,
'args': (input_paths['phys']['dev'], input_paths['phys']['dev-label'], output_paths['phys']['statement']['dev'], output_paths['phys']['statement']['dev-fairseq'])},
{'func': tokenize_statement_file, 'args': (output_paths['phys']['statement']['train'], output_paths['phys']['tokenized']['train'])},
{'func': tokenize_statement_file, 'args': (output_paths['phys']['statement']['dev'], output_paths['phys']['tokenized']['dev'])},
{'func': make_word_vocab, 'args': ((output_paths['phys']['statement']['train'],), output_paths['phys']['statement']['vocab'])},
{'func': ground, 'args': (output_paths['phys']['statement']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['phys']['grounded']['train'], args.nprocs)},
{'func': ground, 'args': (output_paths['phys']['statement']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['phys']['grounded']['dev'], args.nprocs)},
{'func': find_paths, 'args': (output_paths['phys']['grounded']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['phys']['paths']['raw-train'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['phys']['grounded']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['phys']['paths']['raw-dev'], args.nprocs, args.seed)},
{'func': score_paths, 'args': (output_paths['phys']['paths']['raw-train'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['phys']['paths']['scores-train'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['phys']['paths']['raw-dev'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['phys']['paths']['scores-dev'], args.nprocs)},
{'func': prune_paths, 'args': (output_paths['phys']['paths']['raw-train'], output_paths['phys']['paths']['scores-train'],
output_paths['phys']['paths']['pruned-train'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['phys']['paths']['raw-dev'], output_paths['phys']['paths']['scores-dev'],
output_paths['phys']['paths']['pruned-dev'], args.path_prune_threshold)},
{'func': generate_graph, 'args': (output_paths['phys']['grounded']['train'], output_paths['phys']['paths']['pruned-train'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['phys']['graph']['train'])},
{'func': generate_graph, 'args': (output_paths['phys']['grounded']['dev'], output_paths['phys']['paths']['pruned-dev'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['phys']['graph']['dev'])},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['phys']['grounded']['train'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['phys']['graph']['adj-train'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['phys']['grounded']['dev'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['phys']['graph']['adj-dev'], args.nprocs)},
],
'socialiqa': [
{'func': convert_to_socialiqa_statement, 'args': (
input_paths['socialiqa']['train'], input_paths['socialiqa']['train-label'], output_paths['socialiqa']['statement']['train'], output_paths['socialiqa']['statement']['train-fairseq'])},
{'func': convert_to_socialiqa_statement,
'args': (input_paths['socialiqa']['dev'], input_paths['socialiqa']['dev-label'], output_paths['socialiqa']['statement']['dev'], output_paths['socialiqa']['statement']['dev-fairseq'])},
{'func': tokenize_statement_file, 'args': (output_paths['socialiqa']['statement']['train'], output_paths['socialiqa']['tokenized']['train'])},
{'func': tokenize_statement_file, 'args': (output_paths['socialiqa']['statement']['dev'], output_paths['socialiqa']['tokenized']['dev'])},
{'func': make_word_vocab, 'args': ((output_paths['socialiqa']['statement']['train'],), output_paths['socialiqa']['statement']['vocab'])},
{'func': ground, 'args': (output_paths['socialiqa']['statement']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['socialiqa']['grounded']['train'], args.nprocs)},
{'func': ground, 'args': (output_paths['socialiqa']['statement']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['socialiqa']['grounded']['dev'], args.nprocs)},
{'func': find_paths, 'args': (output_paths['socialiqa']['grounded']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['socialiqa']['paths']['raw-train'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['socialiqa']['grounded']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['socialiqa']['paths']['raw-dev'], args.nprocs, args.seed)},
{'func': score_paths, 'args': (output_paths['socialiqa']['paths']['raw-train'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['paths']['scores-train'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['socialiqa']['paths']['raw-dev'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['paths']['scores-dev'], args.nprocs)},
{'func': prune_paths, 'args': (output_paths['socialiqa']['paths']['raw-train'], output_paths['socialiqa']['paths']['scores-train'],
output_paths['socialiqa']['paths']['pruned-train'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['socialiqa']['paths']['raw-dev'], output_paths['socialiqa']['paths']['scores-dev'],
output_paths['socialiqa']['paths']['pruned-dev'], args.path_prune_threshold)},
{'func': generate_graph, 'args': (output_paths['socialiqa']['grounded']['train'], output_paths['socialiqa']['paths']['pruned-train'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['socialiqa']['graph']['train'])},
{'func': generate_graph, 'args': (output_paths['socialiqa']['grounded']['dev'], output_paths['socialiqa']['paths']['pruned-dev'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['socialiqa']['graph']['dev'])},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['socialiqa']['grounded']['train'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['graph']['adj-train'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['socialiqa']['grounded']['dev'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['graph']['adj-dev'], args.nprocs)},
{'func': generate_triples_from_adj, 'args': (output_paths['socialiqa']['graph']['adj-train'], output_paths['socialiqa']['grounded']['train'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['triple']['train'])},
{'func': generate_triples_from_adj, 'args': (output_paths['socialiqa']['graph']['adj-dev'], output_paths['socialiqa']['grounded']['dev'],
output_paths['cpnet']['vocab'], output_paths['socialiqa']['triple']['dev'])},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['socialiqa']['graph']['adj-train'], output_paths['cpnet']['pruned-graph'], output_paths['socialiqa']['paths']['adj-train'], output_paths['socialiqa']['graph']['nxg-from-adj-train'], args.nprocs)},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['socialiqa']['graph']['adj-dev'], output_paths['cpnet']['pruned-graph'], output_paths['socialiqa']['paths']['adj-dev'], output_paths['socialiqa']['graph']['nxg-from-adj-dev'], args.nprocs)},
],
'obqa': [
{'func': convert_to_obqa_statement, 'args': (input_paths['obqa']['train'], output_paths['obqa']['statement']['train'], output_paths['obqa']['statement']['train-fairseq'])},
{'func': convert_to_obqa_statement, 'args': (input_paths['obqa']['dev'], output_paths['obqa']['statement']['dev'], output_paths['obqa']['statement']['dev-fairseq'])},
{'func': convert_to_obqa_statement, 'args': (input_paths['obqa']['test'], output_paths['obqa']['statement']['test'], output_paths['obqa']['statement']['test-fairseq'])},
{'func': tokenize_statement_file, 'args': (output_paths['obqa']['statement']['train'], output_paths['obqa']['tokenized']['train'])},
{'func': tokenize_statement_file, 'args': (output_paths['obqa']['statement']['dev'], output_paths['obqa']['tokenized']['dev'])},
{'func': tokenize_statement_file, 'args': (output_paths['obqa']['statement']['test'], output_paths['obqa']['tokenized']['test'])},
{'func': make_word_vocab, 'args': ((output_paths['obqa']['statement']['train'],), output_paths['obqa']['statement']['vocab'])},
{'func': ground, 'args': (output_paths['obqa']['statement']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['obqa']['grounded']['train'], args.nprocs)},
{'func': ground, 'args': (output_paths['obqa']['statement']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['obqa']['grounded']['dev'], args.nprocs)},
{'func': ground, 'args': (output_paths['obqa']['statement']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['patterns'], output_paths['obqa']['grounded']['test'], args.nprocs)},
{'func': find_paths, 'args': (output_paths['obqa']['grounded']['train'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['raw-train'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['obqa']['grounded']['dev'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['raw-dev'], args.nprocs, args.seed)},
{'func': find_paths, 'args': (output_paths['obqa']['grounded']['test'], output_paths['cpnet']['vocab'],
output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['raw-test'], args.nprocs, args.seed)},
{'func': score_paths, 'args': (output_paths['obqa']['paths']['raw-train'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['obqa']['paths']['scores-train'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['obqa']['paths']['raw-dev'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['obqa']['paths']['scores-dev'], args.nprocs)},
{'func': score_paths, 'args': (output_paths['obqa']['paths']['raw-test'], input_paths['transe']['ent'], input_paths['transe']['rel'],
output_paths['cpnet']['vocab'], output_paths['obqa']['paths']['scores-test'], args.nprocs)},
{'func': prune_paths, 'args': (output_paths['obqa']['paths']['raw-train'], output_paths['obqa']['paths']['scores-train'],
output_paths['obqa']['paths']['pruned-train'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['obqa']['paths']['raw-dev'], output_paths['obqa']['paths']['scores-dev'],
output_paths['obqa']['paths']['pruned-dev'], args.path_prune_threshold)},
{'func': prune_paths, 'args': (output_paths['obqa']['paths']['raw-test'], output_paths['obqa']['paths']['scores-test'],
output_paths['obqa']['paths']['pruned-test'], args.path_prune_threshold)},
{'func': generate_graph, 'args': (output_paths['obqa']['grounded']['train'], output_paths['obqa']['paths']['pruned-train'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['obqa']['graph']['train'])},
{'func': generate_graph, 'args': (output_paths['obqa']['grounded']['dev'], output_paths['obqa']['paths']['pruned-dev'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['obqa']['graph']['dev'])},
{'func': generate_graph, 'args': (output_paths['obqa']['grounded']['test'], output_paths['obqa']['paths']['pruned-test'],
output_paths['cpnet']['vocab'], output_paths['cpnet']['pruned-graph'],
output_paths['obqa']['graph']['test'])},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['obqa']['grounded']['train'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['obqa']['graph']['adj-train'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['obqa']['grounded']['dev'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['obqa']['graph']['adj-dev'], args.nprocs)},
{'func': generate_adj_data_from_grounded_concepts, 'args': (output_paths['obqa']['grounded']['test'], output_paths['cpnet']['pruned-graph'],
output_paths['cpnet']['vocab'], output_paths['obqa']['graph']['adj-test'], args.nprocs)},
{'func': generate_triples_from_adj, 'args': (output_paths['obqa']['graph']['adj-train'], output_paths['obqa']['grounded']['train'],
output_paths['cpnet']['vocab'], output_paths['obqa']['triple']['train'])},
{'func': generate_triples_from_adj, 'args': (output_paths['obqa']['graph']['adj-dev'], output_paths['obqa']['grounded']['dev'],
output_paths['cpnet']['vocab'], output_paths['obqa']['triple']['dev'])},
{'func': generate_triples_from_adj, 'args': (output_paths['obqa']['graph']['adj-test'], output_paths['obqa']['grounded']['test'],
output_paths['cpnet']['vocab'], output_paths['obqa']['triple']['test'])},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['obqa']['graph']['adj-train'], output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['adj-train'], output_paths['obqa']['graph']['nxg-from-adj-train'], args.nprocs)},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['obqa']['graph']['adj-dev'], output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['adj-dev'], output_paths['obqa']['graph']['nxg-from-adj-dev'], args.nprocs)},
{'func': generate_path_and_graph_from_adj, 'args': (output_paths['obqa']['graph']['adj-test'], output_paths['cpnet']['pruned-graph'], output_paths['obqa']['paths']['adj-test'], output_paths['obqa']['graph']['nxg-from-adj-test'], args.nprocs)},
],
'exp': [
{'func': convert_to_entailment,
'args': (input_paths['csqa']['train'], output_paths['csqa']['statement-with-ans-pos']['train'], True)},
{'func': convert_to_entailment,
'args': (input_paths['csqa']['dev'], output_paths['csqa']['statement-with-ans-pos']['dev'], True)},
{'func': convert_to_entailment,
'args': (input_paths['csqa']['test'], output_paths['csqa']['statement-with-ans-pos']['test'], True)},
],
'hswag': [
# TODO
],
'anli': [
# TODO
],
'make_word_vocab': [
{'func': make_word_vocab, 'args': ((output_paths['csqa']['statement']['train'],), output_paths['csqa']['statement']['vocab'])},
{'func': make_word_vocab, 'args': ((output_paths['scitail']['statement']['train'],), output_paths['scitail']['statement']['vocab'])},
{'func': make_word_vocab, 'args': ((output_paths['phys']['statement']['train'],), output_paths['phys']['statement']['vocab'])},
{'func': make_word_vocab, 'args': ((output_paths['socialiqa']['statement']['train'],), output_paths['socialiqa']['statement']['vocab'])},
{'func': make_word_vocab, 'args': ((output_paths['obqa']['statement']['train'],), output_paths['obqa']['statement']['vocab'])},
],
}
for rt in args.run:
for rt_dic in routines[rt]:
rt_dic['func'](*rt_dic['args'])
print('Successfully run {}'.format(' '.join(args.run)))
if __name__ == '__main__':
main()