Spaces:
Runtime error
Runtime error
Update config.py
Browse files
config.py
CHANGED
|
@@ -95,6 +95,7 @@ config = Config()
|
|
| 95 |
def parseArgs():
|
| 96 |
parser = argparse.ArgumentParser(fromfile_prefix_chars = "@")
|
| 97 |
|
|
|
|
| 98 |
################ systems
|
| 99 |
|
| 100 |
#custom args
|
|
@@ -222,7 +223,7 @@ def parseArgs():
|
|
| 222 |
parser.add_argument("--memoryVariationalDropout", action = "store_true", help = "use variational dropout across the MAC network")
|
| 223 |
|
| 224 |
## nonlinearities
|
| 225 |
-
parser.add_argument("--relu", default = "
|
| 226 |
# parser.add_argument("--reluAlpha", default = 0.2, type = float, help = "alpha value for the leaky ReLU")
|
| 227 |
|
| 228 |
parser.add_argument("--mulBias", default = 0.0, type = float, help = "bias to add in multiplications (x + b) * (y + b) for better training") #
|
|
@@ -324,7 +325,7 @@ def parseArgs():
|
|
| 324 |
parser.add_argument("--controlFeedPrev", action = "store_true", help = "feed previous control state")
|
| 325 |
parser.add_argument("--controlFeedPrevAtt", action = "store_true", help = "feed previous control post word attention (otherwise will feed continuous control)")
|
| 326 |
parser.add_argument("--controlFeedInputs", action = "store_true", help = "feed question representation")
|
| 327 |
-
parser.add_argument("--controlContAct", default = "
|
| 328 |
|
| 329 |
# step 2: word attention and optional projection
|
| 330 |
parser.add_argument("--controlConcatWords", action = "store_true", help = "concatenate words to interaction when computing attention")
|
|
@@ -426,33 +427,10 @@ def parseArgs():
|
|
| 426 |
# parser.add_argument("--gumbelSoftmaxBoth", action = "store_true", help = "use softmax for training and testing") #
|
| 427 |
# parser.add_argument("--gumbelArgmaxBoth", action = "store_true", help = "use argmax for training and testing") #
|
| 428 |
|
| 429 |
-
parser.
|
| 430 |
-
|
| 431 |
-
|
| 432 |
-
|
| 433 |
-
useEMA=True,
|
| 434 |
-
lrReduce=True,
|
| 435 |
-
adam=True,
|
| 436 |
-
clip=True,
|
| 437 |
-
memoryVariationalDropout=True,
|
| 438 |
-
relu='ELU',
|
| 439 |
-
encBi=True,
|
| 440 |
-
wrdEmbRandom=True,
|
| 441 |
-
wrdEmbUniform=True,
|
| 442 |
-
outQuestion=True,
|
| 443 |
-
initCtrl='Q',
|
| 444 |
-
controlContextual=True,
|
| 445 |
-
controlInputUnshared=True,
|
| 446 |
-
readProjInputs=True,
|
| 447 |
-
readMemConcatKB=True,
|
| 448 |
-
readMemConcatProj=True,
|
| 449 |
-
readMemProj=True,
|
| 450 |
-
readCtrl=True,
|
| 451 |
-
writeMemProj=True,
|
| 452 |
-
restore=True,
|
| 453 |
-
expName='PDF_exp_extra',
|
| 454 |
-
netLength=16
|
| 455 |
-
)
|
| 456 |
|
| 457 |
###################################### dataset configuration ######################################
|
| 458 |
|
|
|
|
| 95 |
def parseArgs():
|
| 96 |
parser = argparse.ArgumentParser(fromfile_prefix_chars = "@")
|
| 97 |
|
| 98 |
+
|
| 99 |
################ systems
|
| 100 |
|
| 101 |
#custom args
|
|
|
|
| 223 |
parser.add_argument("--memoryVariationalDropout", action = "store_true", help = "use variational dropout across the MAC network")
|
| 224 |
|
| 225 |
## nonlinearities
|
| 226 |
+
parser.add_argument("--relu", default = "ELU", choices = ["STD", "PRM", "ELU", "LKY", "SELU"], type = str, help = "type of ReLU to use: standard, parametric, ELU, or leaky")
|
| 227 |
# parser.add_argument("--reluAlpha", default = 0.2, type = float, help = "alpha value for the leaky ReLU")
|
| 228 |
|
| 229 |
parser.add_argument("--mulBias", default = 0.0, type = float, help = "bias to add in multiplications (x + b) * (y + b) for better training") #
|
|
|
|
| 325 |
parser.add_argument("--controlFeedPrev", action = "store_true", help = "feed previous control state")
|
| 326 |
parser.add_argument("--controlFeedPrevAtt", action = "store_true", help = "feed previous control post word attention (otherwise will feed continuous control)")
|
| 327 |
parser.add_argument("--controlFeedInputs", action = "store_true", help = "feed question representation")
|
| 328 |
+
parser.add_argument("--controlContAct", default = "TANH", type = str, choices = ["NON", "RELU", "TANH"], help = "activation on the words interactions")
|
| 329 |
|
| 330 |
# step 2: word attention and optional projection
|
| 331 |
parser.add_argument("--controlConcatWords", action = "store_true", help = "concatenate words to interaction when computing attention")
|
|
|
|
| 427 |
# parser.add_argument("--gumbelSoftmaxBoth", action = "store_true", help = "use softmax for training and testing") #
|
| 428 |
# parser.add_argument("--gumbelArgmaxBoth", action = "store_true", help = "use argmax for training and testing") #
|
| 429 |
|
| 430 |
+
parser.parse_args(namespace = config)
|
| 431 |
+
|
| 432 |
+
|
| 433 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 434 |
|
| 435 |
###################################### dataset configuration ######################################
|
| 436 |
|