fairseq/models/lightconv.py

Killed 14 out of 131 mutants

Survived

The mutants below survived mutation testing: the test suite still passed with each change applied, so each one marks a hole in your test suite.

Mutant 2725

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -48,7 +48,6 @@
         :prog:
     """
 
-    @classmethod
     def hub_models(cls):
         # fmt: off
 

Mutant 2726

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -78,7 +78,6 @@
     def __init__(self, encoder, decoder):
         super().__init__(encoder, decoder)
 
-    @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',

Mutant 2727

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -81,7 +81,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', type=float, metavar='D',
+        parser.add_argument('XX--dropoutXX', type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 2728

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -81,7 +81,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', type=float, metavar='D',
+        parser.add_argument('--dropout', type=float, metavar='XXDXX',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 2729

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -82,7 +82,7 @@
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
-                            help='dropout probability')
+                            help='XXdropout probabilityXX')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',

Mutant 2730

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -83,7 +83,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', type=float, metavar='D',
+        parser.add_argument('XX--attention-dropoutXX', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 2731

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -83,7 +83,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', type=float, metavar='D',
+        parser.add_argument('--attention-dropout', type=float, metavar='XXDXX',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 2732

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -84,7 +84,7 @@
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
-                            help='dropout probability for attention weights')
+                            help='XXdropout probability for attention weightsXX')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',

Mutant 2733

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -85,7 +85,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', type=float, metavar='D',
+        parser.add_argument('XX--relu-dropoutXX', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 2734

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -85,7 +85,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', type=float, metavar='D',
+        parser.add_argument('--relu-dropout', type=float, metavar='XXDXX',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 2735

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -86,7 +86,7 @@
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
-                            help='dropout probability after ReLU in FFN')
+                            help='XXdropout probability after ReLU in FFNXX')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',

Mutant 2736

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -87,7 +87,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('XX--input-dropoutXX', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')

Mutant 2737

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -87,7 +87,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('--input-dropout', type=float, metavar='XXDXX',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')

Mutant 2738

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -88,7 +88,7 @@
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
-                            help='dropout probability of the inputs')
+                            help='XXdropout probability of the inputsXX')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',

Mutant 2739

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -89,7 +89,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('XX--encoder-embed-pathXX', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2740

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -89,7 +89,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('--encoder-embed-path', type=str, metavar='XXSTRXX',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2741

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -90,7 +90,7 @@
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
-                            help='path to pre-trained encoder embedding')
+                            help='XXpath to pre-trained encoder embeddingXX')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',

Mutant 2742

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -91,7 +91,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
-        parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-embed-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2743

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -91,7 +91,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
-        parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-embed-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2744

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -92,7 +92,7 @@
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
-                            help='encoder embedding dimension')
+                            help='XXencoder embedding dimensionXX')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',

Mutant 2745

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -93,7 +93,7 @@
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-conv-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')

Mutant 2746

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -93,7 +93,7 @@
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-conv-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')

Mutant 2747

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -94,7 +94,7 @@
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
-                            help='encoder embedding dimension')
+                            help='XXencoder embedding dimensionXX')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',

Mutant 2748

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -95,7 +95,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-ffn-embed-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')

Mutant 2749

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -95,7 +95,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')

Mutant 2750

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -96,7 +96,7 @@
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
-                            help='encoder embedding dimension for FFN')
+                            help='XXencoder embedding dimension for FFNXX')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',

Mutant 2751

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -97,7 +97,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
-        parser.add_argument('--encoder-layers', type=int, metavar='N',
+        parser.add_argument('XX--encoder-layersXX', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')

Mutant 2752

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -97,7 +97,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
-        parser.add_argument('--encoder-layers', type=int, metavar='N',
+        parser.add_argument('--encoder-layers', type=int, metavar='XXNXX',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')

Mutant 2753

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -98,7 +98,7 @@
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
-                            help='num encoder layers')
+                            help='XXnum encoder layersXX')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',

Mutant 2754

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -99,7 +99,7 @@
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
-        parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('XX--encoder-attention-headsXX', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')

Mutant 2755

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -99,7 +99,7 @@
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
-        parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('--encoder-attention-heads', type=int, metavar='XXNXX',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')

Mutant 2756

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -100,7 +100,7 @@
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
-                            help='num encoder attention heads or LightConv/DynamicConv heads')
+                            help='XXnum encoder attention heads or LightConv/DynamicConv headsXX')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',

Mutant 2757

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -101,7 +101,7 @@
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--encoder-normalize-before', action='store_true',
+        parser.add_argument('XX--encoder-normalize-beforeXX', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')

Mutant 2759

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -102,7 +102,7 @@
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
-                            help='apply layernorm before each encoder block')
+                            help='XXapply layernorm before each encoder blockXX')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',

Mutant 2760

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -103,7 +103,7 @@
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
-        parser.add_argument('--encoder-learned-pos', action='store_true',
+        parser.add_argument('XX--encoder-learned-posXX', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')

Mutant 2762

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -104,7 +104,7 @@
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
-                            help='use learned positional embeddings in the encoder')
+                            help='XXuse learned positional embeddings in the encoderXX')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',

Mutant 2763

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -105,7 +105,7 @@
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
-        parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('XX--decoder-embed-pathXX', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2764

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -105,7 +105,7 @@
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
-        parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('--decoder-embed-path', type=str, metavar='XXSTRXX',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2765

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -106,7 +106,7 @@
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
-                            help='path to pre-trained decoder embedding')
+                            help='XXpath to pre-trained decoder embeddingXX')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',

Mutant 2766

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -107,7 +107,7 @@
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2767

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -107,7 +107,7 @@
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2768

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -108,7 +108,7 @@
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension')
+                            help='XXdecoder embedding dimensionXX')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',

Mutant 2769

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -109,7 +109,7 @@
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-conv-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 2770

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -109,7 +109,7 @@
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-conv-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 2771

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -110,7 +110,7 @@
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
-                            help='decoder embedding dimension')
+                            help='XXdecoder embedding dimensionXX')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',

Mutant 2772

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -111,7 +111,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-ffn-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 2773

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -111,7 +111,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 2774

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -112,7 +112,7 @@
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension for FFN')
+                            help='XXdecoder embedding dimension for FFNXX')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',

Mutant 2775

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -113,7 +113,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('XX--decoder-layersXX', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 2776

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -113,7 +113,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('--decoder-layers', type=int, metavar='XXNXX',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 2777

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -114,7 +114,7 @@
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
-                            help='num decoder layers')
+                            help='XXnum decoder layersXX')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',

Mutant 2778

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -115,7 +115,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('XX--decoder-attention-headsXX', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')

Mutant 2779

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -115,7 +115,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('--decoder-attention-heads', type=int, metavar='XXNXX',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')

Mutant 2780

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -116,7 +116,7 @@
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
-                            help='num decoder attention heads or LightConv/DynamicConv heads')
+                            help='XXnum decoder attention heads or LightConv/DynamicConv headsXX')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',

Mutant 2781

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -117,7 +117,7 @@
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--decoder-learned-pos', action='store_true',
+        parser.add_argument('XX--decoder-learned-posXX', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')

Mutant 2783

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -118,7 +118,7 @@
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
-                            help='use learned positional embeddings in the decoder')
+                            help='XXuse learned positional embeddings in the decoderXX')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',

Mutant 2784

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -119,7 +119,7 @@
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
-        parser.add_argument('--decoder-normalize-before', action='store_true',
+        parser.add_argument('XX--decoder-normalize-beforeXX', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')

Mutant 2786

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -120,7 +120,7 @@
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
-                            help='apply layernorm before each decoder block')
+                            help='XXapply layernorm before each decoder blockXX')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',

Mutant 2787

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -121,7 +121,7 @@
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
-        parser.add_argument('--share-decoder-input-output-embed', action='store_true',
+        parser.add_argument('XX--share-decoder-input-output-embedXX', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'

Mutant 2789

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -122,7 +122,7 @@
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
-                            help='share decoder input and output embeddings')
+                            help='XXshare decoder input and output embeddingsXX')
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')

Mutant 2790

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -123,7 +123,7 @@
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
-        parser.add_argument('--share-all-embeddings', action='store_true',
+        parser.add_argument('XX--share-all-embeddingsXX', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',

Mutant 2792

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -124,7 +124,7 @@
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',
-                            help='share encoder, decoder and output embeddings'
+                            help='XXshare encoder, decoder and output embeddingsXX'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '

Mutant 2793

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -126,7 +126,7 @@
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('XX--adaptive-softmax-cutoffXX', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 2794

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -126,7 +126,7 @@
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('--adaptive-softmax-cutoff', metavar='XXEXPRXX',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 2795

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -127,7 +127,7 @@
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
-                            help='comma separated list of adaptive softmax cutoff points. '
+                            help='XXcomma separated list of adaptive softmax cutoff points. XX'
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')

Mutant 2796

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -129,7 +129,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('XX--adaptive-softmax-dropoutXX', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""

Mutant 2797

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -129,7 +129,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='XXDXX',
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""

Mutant 2798

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -130,7 +130,7 @@
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
-                            help='sets adaptive softmax dropout for the tail projections')
+                            help='XXsets adaptive softmax dropout for the tail projectionsXX')
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),

Mutant 2799

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -133,7 +133,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('XX--encoder-kernel-size-listXX', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')

Mutant 2800

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -133,7 +133,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('--encoder-kernel-size-list', type=lambda x: None,
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')

Mutant 2801

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -134,7 +134,7 @@
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
-                            help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
+                            help='XXlist of kernel size (default: "[3,7,15,31,31,31,31]")XX')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,

Mutant 2802

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -135,7 +135,7 @@
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('XX--decoder-kernel-size-listXX', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2803

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -135,7 +135,7 @@
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('--decoder-kernel-size-list', type=lambda x: None,
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2804

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -136,7 +136,7 @@
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
-                            help='list of kernel size (default: "[3,7,15,31,31,31]")')
+                            help='XXlist of kernel size (default: "[3,7,15,31,31,31]")XX')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,

Mutant 2805

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -137,7 +137,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
-        parser.add_argument('--encoder-glu', type=options.eval_bool,
+        parser.add_argument('XX--encoder-gluXX', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2806

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -138,7 +138,7 @@
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
-                            help='glu after in proj')
+                            help='XXglu after in projXX')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,

Mutant 2807

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -139,7 +139,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--decoder-glu', type=options.eval_bool,
+        parser.add_argument('XX--decoder-gluXX', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2808

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -140,7 +140,7 @@
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
-                            help='glu after in proj')
+                            help='XXglu after in projXX')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')

Mutant 2809

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -141,7 +141,7 @@
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('XX--encoder-conv-typeXX', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,

Mutant 2810

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -141,7 +141,7 @@
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('--encoder-conv-type', default='XXdynamicXX', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,

Mutant 2811

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -142,7 +142,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['XXdynamicXX', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2812

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -142,7 +142,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['dynamic', 'XXlightweightXX'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2813

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -143,7 +143,7 @@
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
-                            help='type of convolution')
+                            help='XXtype of convolutionXX')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')

Mutant 2814

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -144,7 +144,7 @@
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('XX--decoder-conv-typeXX', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 2815

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -144,7 +144,7 @@
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('--decoder-conv-type', default='XXdynamicXX', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 2816

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -145,7 +145,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['XXdynamicXX', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 2817

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -145,7 +145,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['dynamic', 'XXlightweightXX'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 2818

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -146,7 +146,7 @@
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
-                            help='type of convolution')
+                            help='XXtype of convolutionXX')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')

Mutant 2819

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -147,7 +147,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('XX--weight-softmaxXX', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 2820

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -147,7 +147,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('--weight-softmax', default=False, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 2821

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -148,7 +148,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('XX--weight-dropoutXX', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 2822

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -148,7 +148,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('--weight-dropout', type=float, metavar='XXDXX',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 2823

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -149,7 +149,7 @@
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
-                            help='dropout probability for conv weights')
+                            help='XXdropout probability for conv weightsXX')
 
     @classmethod
     def build_model(cls, args, task):

Mutant 2824

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -151,7 +151,6 @@
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
-    @classmethod
     def build_model(cls, args, task):
         """Build a new model instance."""
 

Mutant 2825

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -316,7 +316,7 @@
             Default: ``False``
     """
 
-    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=True):
+    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=True, final_norm=True):
         super().__init__(dictionary)
         self.dropout_module = FairseqDropout(args.dropout, module_name=self.__class__.__name__)
         self.share_input_output_embed = args.share_decoder_input_output_embed

Mutant 2826

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -316,7 +316,7 @@
             Default: ``False``
     """
 
-    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=True):
+    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=False):
         super().__init__(dictionary)
         self.dropout_module = FairseqDropout(args.dropout, module_name=self.__class__.__name__)
         self.share_input_output_embed = args.share_decoder_input_output_embed

Mutant 2827

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -462,7 +462,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, kernel_size=0):
+    def __init__(self, args, kernel_size=1):
         super().__init__()
         self.embed_dim = args.encoder_embed_dim
         self.conv_dim = args.encoder_conv_dim

Mutant 2828

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -530,7 +530,7 @@
         x = self.maybe_layer_norm(1, x, after=True)
         return x
 
-    def maybe_layer_norm(self, i, x, before=False, after=False):
+    def maybe_layer_norm(self, i, x, before=True, after=False):
         assert before ^ after
         if after ^ self.normalize_before:
             return self.layer_norms[i](x)

Mutant 2829

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -530,7 +530,7 @@
         x = self.maybe_layer_norm(1, x, after=True)
         return x
 
-    def maybe_layer_norm(self, i, x, before=False, after=False):
+    def maybe_layer_norm(self, i, x, before=False, after=True):
         assert before ^ after
         if after ^ self.normalize_before:
             return self.layer_norms[i](x)

Mutant 2830

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -552,7 +552,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, no_encoder_attn=False, kernel_size=0):
+    def __init__(self, args, no_encoder_attn=True, kernel_size=0):
         super().__init__()
         self.embed_dim = args.decoder_embed_dim
         self.conv_dim = args.decoder_conv_dim

Mutant 2831

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -552,7 +552,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, no_encoder_attn=False, kernel_size=0):
+    def __init__(self, args, no_encoder_attn=False, kernel_size=1):
         super().__init__()
         self.embed_dim = args.decoder_embed_dim
         self.conv_dim = args.decoder_conv_dim

Mutant 2832

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -660,7 +660,7 @@
         x = self.maybe_layer_norm(self.final_layer_norm, x, after=True)
         return x, attn
 
-    def maybe_layer_norm(self, layer_norm, x, before=False, after=False):
+    def maybe_layer_norm(self, layer_norm, x, before=True, after=False):
         assert before ^ after
         if after ^ self.normalize_before:
             return layer_norm(x)

Mutant 2833

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -660,7 +660,7 @@
         x = self.maybe_layer_norm(self.final_layer_norm, x, after=True)
         return x, attn
 
-    def maybe_layer_norm(self, layer_norm, x, before=False, after=False):
+    def maybe_layer_norm(self, layer_norm, x, before=False, after=True):
         assert before ^ after
         if after ^ self.normalize_before:
             return layer_norm(x)

Mutant 2834

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -667,7 +667,7 @@
         else:
             return x
 
-    def make_generation_fast_(self, need_attn=False, **kwargs):
+    def make_generation_fast_(self, need_attn=True, **kwargs):
         self.need_attn = need_attn
 
     def extra_repr(self):

Mutant 2835

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -682,7 +682,7 @@
     return m
 
 
-def Linear(in_features, out_features, bias=True):
+def Linear(in_features, out_features, bias=False):
     m = nn.Linear(in_features, out_features, bias)
     nn.init.xavier_uniform_(m.weight)
     if bias:

Mutant 2837

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -690,7 +690,7 @@
     return m
 
 
-@register_model_architecture('lightconv', 'lightconv')
+@register_model_architecture('lightconv', 'XXlightconvXX')
 def base_architecture(args):
     args.encoder_embed_path = getattr(args, 'encoder_embed_path', None)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)

Mutant 2838

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -689,8 +689,6 @@
         nn.init.constant_(m.bias, 0.)
     return m
 
-
-@register_model_architecture('lightconv', 'lightconv')
 def base_architecture(args):
     args.encoder_embed_path = getattr(args, 'encoder_embed_path', None)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)

Mutant 2840

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -735,7 +735,7 @@
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
 
-@register_model_architecture('lightconv', 'lightconv_iwslt_de_en')
+@register_model_architecture('lightconv', 'XXlightconv_iwslt_de_enXX')
 def lightconv_iwslt_de_en(args):
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)
     args.encoder_ffn_embed_dim = getattr(args, 'encoder_ffn_embed_dim', 1024)

Mutant 2841

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -734,8 +734,6 @@
     args.input_dropout = getattr(args, 'input_dropout', 0.1)
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
-
-@register_model_architecture('lightconv', 'lightconv_iwslt_de_en')
 def lightconv_iwslt_de_en(args):
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)
     args.encoder_ffn_embed_dim = getattr(args, 'encoder_ffn_embed_dim', 1024)

Mutant 2843

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -753,7 +753,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_deXX')
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 

Mutant 2844

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -752,8 +752,6 @@
     args.input_dropout = getattr(args, 'input_dropout', 0.0)
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de')
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 

Mutant 2846

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -758,7 +758,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_de_bigXX')
 def lightconv_wmt_en_de_big(args):
     args.attention_dropout = getattr(args, 'attention_dropout', 0.1)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 1024)

Mutant 2847

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -757,8 +757,6 @@
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de_big')
 def lightconv_wmt_en_de_big(args):
     args.attention_dropout = getattr(args, 'attention_dropout', 0.1)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 1024)

Mutant 2849

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -772,7 +772,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_fr_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_fr_bigXX')
 def lightconv_wmt_en_fr_big(args):
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)

Mutant 2850

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -771,8 +771,6 @@
     args.dropout = getattr(args, 'dropout', 0.3)
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_fr_big')
 def lightconv_wmt_en_fr_big(args):
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)

Mutant 2852

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -778,7 +778,7 @@
     lightconv_wmt_en_de_big(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_zh_en_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_zh_en_bigXX')
 def lightconv_wmt_zh_en_big(args):
     args.dropout = getattr(args, 'dropout', 0.2)
     args.attention_dropout = getattr(args, 'attention_dropout', 0.2)

Mutant 2853

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -777,8 +777,6 @@
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_zh_en_big')
 def lightconv_wmt_zh_en_big(args):
     args.dropout = getattr(args, 'dropout', 0.2)
     args.attention_dropout = getattr(args, 'attention_dropout', 0.2)