fairseq/models/lightconv_lm.py

Killed 12 out of 114 mutants

Survived

The mutants listed below survived mutation testing: the test suite still passed with each change applied, so each one marks a gap in test coverage.

Mutant 1546

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -24,7 +24,6 @@
     def __init__(self, decoder):
         super().__init__(decoder)
 
-    @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',

Mutant 1547

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -27,7 +27,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
+        parser.add_argument('XX--dropoutXX', default=0.1, type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 1548

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -27,7 +27,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
+        parser.add_argument('--dropout', default=1.1, type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 1549

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -27,7 +27,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
+        parser.add_argument('--dropout', default=0.1, type=float, metavar='XXDXX',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 1550

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -28,7 +28,7 @@
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
-                            help='dropout probability')
+                            help='XXdropout probabilityXX')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',

Mutant 1551

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -29,7 +29,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('XX--attention-dropoutXX', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 1552

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -29,7 +29,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('--attention-dropout', default=1.0, type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 1553

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -29,7 +29,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('--attention-dropout', default=0., type=float, metavar='XXDXX',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 1554

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -30,7 +30,7 @@
         parser.add_argument('--dropout', default=0.1, type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
-                            help='dropout probability for attention weights')
+                            help='XXdropout probability for attention weightsXX')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',

Mutant 1555

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -31,7 +31,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('XX--relu-dropoutXX', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 1556

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -31,7 +31,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('--relu-dropout', default=1.0, type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 1557

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -31,7 +31,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
+        parser.add_argument('--relu-dropout', default=0., type=float, metavar='XXDXX',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 1558

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -32,7 +32,7 @@
         parser.add_argument('--attention-dropout', default=0., type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
-                            help='dropout probability after ReLU in FFN')
+                            help='XXdropout probability after ReLU in FFNXX')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',

Mutant 1559

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -33,7 +33,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('XX--input-dropoutXX', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 1560

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -33,7 +33,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('--input-dropout', type=float, metavar='XXDXX',
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 1561

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -34,7 +34,7 @@
         parser.add_argument('--relu-dropout', default=0., type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
-                            help='dropout probability of the inputs')
+                            help='XXdropout probability of the inputsXX')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',

Mutant 1562

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -35,7 +35,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')

Mutant 1563

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -35,7 +35,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')

Mutant 1564

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -36,7 +36,7 @@
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension')
+                            help='XXdecoder embedding dimensionXX')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',

Mutant 1565

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -37,7 +37,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-output-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-output-dimXX', type=int, metavar='N',
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')

Mutant 1566

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -37,7 +37,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-output-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-output-dim', type=int, metavar='XXNXX',
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')

Mutant 1567

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -38,7 +38,7 @@
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
-                            help='decoder output dimension')
+                            help='XXdecoder output dimensionXX')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',

Mutant 1568

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -39,7 +39,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')
-        parser.add_argument('--decoder-input-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-input-dimXX', type=int, metavar='N',
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 1569

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -39,7 +39,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')
-        parser.add_argument('--decoder-input-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-input-dim', type=int, metavar='XXNXX',
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 1570

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -40,7 +40,7 @@
         parser.add_argument('--decoder-output-dim', type=int, metavar='N',
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
-                            help='decoder input dimension')
+                            help='XXdecoder input dimensionXX')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',

Mutant 1571

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -41,7 +41,7 @@
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-ffn-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 1572

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -41,7 +41,7 @@
                             help='decoder output dimension')
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 1573

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -42,7 +42,7 @@
         parser.add_argument('--decoder-input-dim', type=int, metavar='N',
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension for FFN')
+                            help='XXdecoder embedding dimension for FFNXX')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',

Mutant 1574

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -43,7 +43,7 @@
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('XX--decoder-layersXX', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 1575

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -43,7 +43,7 @@
                             help='decoder input dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('--decoder-layers', type=int, metavar='XXNXX',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 1576

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -44,7 +44,7 @@
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
-                            help='num decoder layers')
+                            help='XXnum decoder layersXX')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',

Mutant 1577

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -45,7 +45,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('XX--decoder-attention-headsXX', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')

Mutant 1578

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -45,7 +45,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('--decoder-attention-heads', type=int, metavar='XXNXX',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')

Mutant 1579

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -46,7 +46,7 @@
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
-                            help='num decoder attention heads or LightConv/DynamicConv heads')
+                            help='XXnum decoder attention heads or LightConv/DynamicConv headsXX')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',

Mutant 1580

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -47,7 +47,7 @@
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
+        parser.add_argument('XX--decoder-normalize-beforeXX', default=False, action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '

Mutant 1581

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -47,7 +47,7 @@
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
+        parser.add_argument('--decoder-normalize-before', default=True, action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '

Mutant 1583

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -48,7 +48,7 @@
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
-                            help='apply layernorm before each decoder block')
+                            help='XXapply layernorm before each decoder blockXX')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')

Mutant 1584

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -49,7 +49,7 @@
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('XX--adaptive-softmax-cutoffXX', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 1585

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -49,7 +49,7 @@
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('--adaptive-softmax-cutoff', metavar='XXEXPRXX',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 1586

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -50,7 +50,7 @@
         parser.add_argument('--decoder-normalize-before', default=False, action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
-                            help='comma separated list of adaptive softmax cutoff points. '
+                            help='XXcomma separated list of adaptive softmax cutoff points. XX'
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')

Mutant 1587

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -52,7 +52,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('XX--adaptive-softmax-dropoutXX', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')

Mutant 1588

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -52,7 +52,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='XXDXX',
                             help='sets adaptive softmax dropout for the tail projections')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')

Mutant 1589

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -53,7 +53,7 @@
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
-                            help='sets adaptive softmax dropout for the tail projections')
+                            help='XXsets adaptive softmax dropout for the tail projectionsXX')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',

Mutant 1590

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -54,7 +54,7 @@
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
-        parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
+        parser.add_argument('XX--adaptive-softmax-factorXX', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')

Mutant 1591

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -54,7 +54,7 @@
                                  'Must be used with adaptive_loss criterion')
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
-        parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
+        parser.add_argument('--adaptive-softmax-factor', type=float, metavar='XXNXX',
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')

Mutant 1592

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -55,7 +55,7 @@
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
-                            help='adaptive input factor')
+                            help='XXadaptive input factorXX')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',

Mutant 1593

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -56,7 +56,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')
-        parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
+        parser.add_argument('XX--no-token-positional-embeddingsXX', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')

Mutant 1594

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -56,7 +56,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')
-        parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
+        parser.add_argument('--no-token-positional-embeddings', default=True, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')

Mutant 1596

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -57,7 +57,7 @@
         parser.add_argument('--adaptive-softmax-factor', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
-                            help='if set, disables positional embeddings (outside self attention)')
+                            help='XXif set, disables positional embeddings (outside self attention)XX')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',

Mutant 1597

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -58,7 +58,7 @@
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
-        parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
+        parser.add_argument('XX--share-decoder-input-output-embedXX', default=False, action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')

Mutant 1598

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -58,7 +58,7 @@
                             help='adaptive input factor')
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
-        parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
+        parser.add_argument('--share-decoder-input-output-embed', default=True, action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')

Mutant 1600

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -59,7 +59,7 @@
         parser.add_argument('--no-token-positional-embeddings', default=False, action='store_true',
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
-                            help='share decoder input and output embeddings')
+                            help='XXshare decoder input and output embeddingsXX')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
         parser.add_argument('--character-filters', type=str, metavar='LIST',

Mutant 1601

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -60,7 +60,7 @@
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')
-        parser.add_argument('--character-embeddings', default=False, action='store_true',
+        parser.add_argument('XX--character-embeddingsXX', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',

Mutant 1602

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -60,7 +60,7 @@
                             help='if set, disables positional embeddings (outside self attention)')
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')
-        parser.add_argument('--character-embeddings', default=False, action='store_true',
+        parser.add_argument('--character-embeddings', default=True, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',

Mutant 1604

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -61,7 +61,7 @@
         parser.add_argument('--share-decoder-input-output-embed', default=False, action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
-                            help='if set, uses character embedding convolutions to produce token embeddings')
+                            help='XXif set, uses character embedding convolutions to produce token embeddingsXX')
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')

Mutant 1605

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -62,7 +62,7 @@
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
-        parser.add_argument('--character-filters', type=str, metavar='LIST',
+        parser.add_argument('XX--character-filtersXX', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,

Mutant 1606

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -62,7 +62,7 @@
                             help='share decoder input and output embeddings')
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
-        parser.add_argument('--character-filters', type=str, metavar='LIST',
+        parser.add_argument('--character-filters', type=str, metavar='XXLISTXX',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,

Mutant 1607

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -63,7 +63,7 @@
         parser.add_argument('--character-embeddings', default=False, action='store_true',
                             help='if set, uses character embedding convolutions to produce token embeddings')
         parser.add_argument('--character-filters', type=str, metavar='LIST',
-                            default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
+                            default='XX[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]XX',
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')

Mutant 1608

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -64,7 +64,7 @@
                             help='if set, uses character embedding convolutions to produce token embeddings')
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
-                            help='size of character embeddings')
+                            help='XXsize of character embeddingsXX')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,

Mutant 1609

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -65,7 +65,7 @@
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
-        parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
+        parser.add_argument('XX--character-embedding-dimXX', type=int, metavar='N', default=4,
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')

Mutant 1610

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -65,7 +65,7 @@
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
-        parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
+        parser.add_argument('--character-embedding-dim', type=int, metavar='XXNXX', default=4,
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')

Mutant 1611

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -65,7 +65,7 @@
         parser.add_argument('--character-filters', type=str, metavar='LIST',
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
-        parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
+        parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=5,
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')

Mutant 1612

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -66,7 +66,7 @@
                             default='[(1, 64), (2, 128), (3, 192), (4, 256), (5, 256), (6, 256), (7, 256)]',
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
-                            help='size of character embeddings')
+                            help='XXsize of character embeddingsXX')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',

Mutant 1613

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -67,7 +67,7 @@
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')
-        parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
+        parser.add_argument('XX--char-embedder-highway-layersXX', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')

Mutant 1614

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -67,7 +67,7 @@
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')
-        parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
+        parser.add_argument('--char-embedder-highway-layers', type=int, metavar='XXNXX', default=2,
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')

Mutant 1615

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -67,7 +67,7 @@
                             help='size of character embeddings')
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')
-        parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
+        parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=3,
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')

Mutant 1616

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -68,7 +68,7 @@
         parser.add_argument('--character-embedding-dim', type=int, metavar='N', default=4,
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
-                            help='number of highway layers for character token embeddder')
+                            help='XXnumber of highway layers for character token embeddderXX')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',

Mutant 1617

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -69,7 +69,7 @@
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')
-        parser.add_argument('--adaptive-input', default=False, action='store_true',
+        parser.add_argument('XX--adaptive-inputXX', default=False, action='store_true',
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')

Mutant 1618

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -69,7 +69,7 @@
                             help='size of character embeddings')
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')
-        parser.add_argument('--adaptive-input', default=False, action='store_true',
+        parser.add_argument('--adaptive-input', default=True, action='store_true',
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')

Mutant 1620

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -70,7 +70,7 @@
         parser.add_argument('--char-embedder-highway-layers', type=int, metavar='N', default=2,
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
-                            help='if set, uses adaptive input')
+                            help='XXif set, uses adaptive inputXX')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',

Mutant 1621

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -71,7 +71,7 @@
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')
-        parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
+        parser.add_argument('XX--adaptive-input-factorXX', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')

Mutant 1622

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -71,7 +71,7 @@
                             help='number of highway layers for character token embeddder')
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')
-        parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
+        parser.add_argument('--adaptive-input-factor', type=float, metavar='XXNXX',
                             help='adaptive input factor')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')

Mutant 1623

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -72,7 +72,7 @@
         parser.add_argument('--adaptive-input', default=False, action='store_true',
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
-                            help='adaptive input factor')
+                            help='XXadaptive input factorXX')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')
         parser.add_argument('--tie-adaptive-weights', action='store_true',

Mutant 1624

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -73,7 +73,7 @@
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')
-        parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
+        parser.add_argument('XX--adaptive-input-cutoffXX', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')
         parser.add_argument('--tie-adaptive-weights', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')

Mutant 1625

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -73,7 +73,7 @@
                             help='if set, uses adaptive input')
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')
-        parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
+        parser.add_argument('--adaptive-input-cutoff', metavar='XXEXPRXX',
                             help='comma separated list of adaptive input cutoff points.')
         parser.add_argument('--tie-adaptive-weights', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')

Mutant 1626

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -74,7 +74,7 @@
         parser.add_argument('--adaptive-input-factor', type=float, metavar='N',
                             help='adaptive input factor')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
-                            help='comma separated list of adaptive input cutoff points.')
+                            help='XXcomma separated list of adaptive input cutoff points.XX')
         parser.add_argument('--tie-adaptive-weights', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')
         parser.add_argument('--tie-adaptive-proj', action='store_true',

Mutant 1627

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -75,7 +75,7 @@
                             help='adaptive input factor')
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')
-        parser.add_argument('--tie-adaptive-weights', action='store_true',
+        parser.add_argument('XX--tie-adaptive-weightsXX', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')
         parser.add_argument('--tie-adaptive-proj', action='store_true',
                             help='if set, ties the projection weights of adaptive softmax and adaptive input')

Mutant 1629

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -76,7 +76,7 @@
         parser.add_argument('--adaptive-input-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive input cutoff points.')
         parser.add_argument('--tie-adaptive-weights', action='store_true',
-                            help='if set, ties the weights of adaptive softmax and adaptive input')
+                            help='XXif set, ties the weights of adaptive softmax and adaptive inputXX')
         parser.add_argument('--tie-adaptive-proj', action='store_true',
                             help='if set, ties the projection weights of adaptive softmax and adaptive input')
         parser.add_argument('--decoder-learned-pos', action='store_true',

Mutant 1630

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -77,7 +77,7 @@
                             help='comma separated list of adaptive input cutoff points.')
         parser.add_argument('--tie-adaptive-weights', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')
-        parser.add_argument('--tie-adaptive-proj', action='store_true',
+        parser.add_argument('XX--tie-adaptive-projXX', action='store_true',
                             help='if set, ties the projection weights of adaptive softmax and adaptive input')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')

Mutant 1632

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -78,7 +78,7 @@
         parser.add_argument('--tie-adaptive-weights', action='store_true',
                             help='if set, ties the weights of adaptive softmax and adaptive input')
         parser.add_argument('--tie-adaptive-proj', action='store_true',
-                            help='if set, ties the projection weights of adaptive softmax and adaptive input')
+                            help='XXif set, ties the projection weights of adaptive softmax and adaptive inputXX')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
 

Mutant 1633

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -79,7 +79,7 @@
                             help='if set, ties the weights of adaptive softmax and adaptive input')
         parser.add_argument('--tie-adaptive-proj', action='store_true',
                             help='if set, ties the projection weights of adaptive softmax and adaptive input')
-        parser.add_argument('--decoder-learned-pos', action='store_true',
+        parser.add_argument('XX--decoder-learned-posXX', action='store_true',
                             help='use learned positional embeddings in the decoder')
 
         """LightConv and DynamicConv arguments"""

Mutant 1635

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -80,7 +80,7 @@
         parser.add_argument('--tie-adaptive-proj', action='store_true',
                             help='if set, ties the projection weights of adaptive softmax and adaptive input')
         parser.add_argument('--decoder-learned-pos', action='store_true',
-                            help='use learned positional embeddings in the decoder')
+                            help='XXuse learned positional embeddings in the decoderXX')
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),

Mutant 1636

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -83,7 +83,7 @@
                             help='use learned positional embeddings in the decoder')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('XX--decoder-kernel-size-listXX', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 1637

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -83,7 +83,7 @@
                             help='use learned positional embeddings in the decoder')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('--decoder-kernel-size-list', type=lambda x: None,
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 1638

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -84,7 +84,7 @@
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
-                            help='list of kernel size (default: "[3,7,15,31,31,31]")')
+                            help='XXlist of kernel size (default: "[3,7,15,31,31,31]")XX')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,

Mutant 1639

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -85,7 +85,7 @@
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
-        parser.add_argument('--decoder-glu', type=options.eval_bool,
+        parser.add_argument('XX--decoder-gluXX', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 1640

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -86,7 +86,7 @@
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
-                            help='glu after in proj')
+                            help='XXglu after in projXX')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')

Mutant 1641

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -87,7 +87,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('XX--decoder-conv-typeXX', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 1642

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -87,7 +87,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('--decoder-conv-type', default='XXdynamicXX', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 1643

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -88,7 +88,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['XXdynamicXX', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 1644

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -88,7 +88,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['dynamic', 'XXlightweightXX'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 1645

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -89,7 +89,7 @@
                             help='glu after in proj')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
-                            help='type of convolution')
+                            help='XXtype of convolutionXX')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')

Mutant 1646

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -90,7 +90,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('XX--weight-softmaxXX', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 1647

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -90,7 +90,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('--weight-softmax', default=False, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 1648

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -91,7 +91,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('XX--weight-dropoutXX', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 1649

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -91,7 +91,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('--weight-dropout', type=float, metavar='XXDXX',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 1650

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -92,7 +92,7 @@
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
-                            help='dropout probability for conv weights')
+                            help='XXdropout probability for conv weightsXX')
 
     @classmethod
     def build_model(cls, args, task):

Mutant 1651

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -94,7 +94,6 @@
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
-    @classmethod
     def build_model(cls, args, task):
         """Build a new model instance."""
 

Mutant 1653

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -130,7 +130,7 @@
         return LightConvLanguageModel(decoder)
 
 
-@register_model_architecture('lightconv_lm', 'lightconv_lm')
+@register_model_architecture('lightconv_lm', 'XXlightconv_lmXX')
 def base_lm_architecture(args):
     args.decoder_embed_dim = getattr(args, 'decoder_embed_dim', 512)
     args.decoder_ffn_embed_dim = getattr(args, 'decoder_ffn_embed_dim', 2048)

Mutant 1654

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -129,8 +129,6 @@
         decoder = LightConvDecoder(args, task.output_dictionary, embed_tokens, no_encoder_attn=True, final_norm=False)
         return LightConvLanguageModel(decoder)
 
-
-@register_model_architecture('lightconv_lm', 'lightconv_lm')
 def base_lm_architecture(args):
     args.decoder_embed_dim = getattr(args, 'decoder_embed_dim', 512)
     args.decoder_ffn_embed_dim = getattr(args, 'decoder_ffn_embed_dim', 2048)

Mutant 1656

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -166,7 +166,7 @@
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
 
-@register_model_architecture('lightconv_lm', 'lightconv_lm_gbw')
+@register_model_architecture('lightconv_lm', 'XXlightconv_lm_gbwXX')
 def lightconv_lm_gbw(args):
     args.decoder_embed_dim = getattr(args, 'decoder_embed_dim', 512)
     args.dropout = getattr(args, 'dropout', 0.1)

Mutant 1657

--- fairseq/models/lightconv_lm.py
+++ fairseq/models/lightconv_lm.py
@@ -165,8 +165,6 @@
     args.input_dropout = getattr(args, 'input_dropout', 0.1)
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
-
-@register_model_architecture('lightconv_lm', 'lightconv_lm_gbw')
 def lightconv_lm_gbw(args):
     args.decoder_embed_dim = getattr(args, 'decoder_embed_dim', 512)
     args.dropout = getattr(args, 'dropout', 0.1)