fairseq/models/lightconv.py

Killed 14 out of 131 mutants

Survived

The mutants listed below survived mutation testing: the test suite still passed with each change applied, so every one of them marks a hole in your test suite.

Mutant 2490

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -48,7 +48,6 @@
         :prog:
     """
 
-    @classmethod
     def hub_models(cls):
         # fmt: off
 

Mutant 2491

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -78,7 +78,6 @@
     def __init__(self, encoder, decoder):
         super().__init__(encoder, decoder)
 
-    @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',

Mutant 2492

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -81,7 +81,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', type=float, metavar='D',
+        parser.add_argument('XX--dropoutXX', type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 2493

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -81,7 +81,7 @@
     @staticmethod
     def add_args(parser):
         """Add model-specific arguments to the parser."""
-        parser.add_argument('--dropout', type=float, metavar='D',
+        parser.add_argument('--dropout', type=float, metavar='XXDXX',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')

Mutant 2494

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -82,7 +82,7 @@
     def add_args(parser):
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
-                            help='dropout probability')
+                            help='XXdropout probabilityXX')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',

Mutant 2495

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -83,7 +83,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', type=float, metavar='D',
+        parser.add_argument('XX--attention-dropoutXX', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 2496

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -83,7 +83,7 @@
         """Add model-specific arguments to the parser."""
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
-        parser.add_argument('--attention-dropout', type=float, metavar='D',
+        parser.add_argument('--attention-dropout', type=float, metavar='XXDXX',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')

Mutant 2497

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -84,7 +84,7 @@
         parser.add_argument('--dropout', type=float, metavar='D',
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
-                            help='dropout probability for attention weights')
+                            help='XXdropout probability for attention weightsXX')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',

Mutant 2498

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -85,7 +85,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', type=float, metavar='D',
+        parser.add_argument('XX--relu-dropoutXX', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 2499

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -85,7 +85,7 @@
                             help='dropout probability')
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
-        parser.add_argument('--relu-dropout', type=float, metavar='D',
+        parser.add_argument('--relu-dropout', type=float, metavar='XXDXX',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')

Mutant 2500

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -86,7 +86,7 @@
         parser.add_argument('--attention-dropout', type=float, metavar='D',
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
-                            help='dropout probability after ReLU in FFN')
+                            help='XXdropout probability after ReLU in FFNXX')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',

Mutant 2501

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -87,7 +87,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('XX--input-dropoutXX', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')

Mutant 2502

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -87,7 +87,7 @@
                             help='dropout probability for attention weights')
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
-        parser.add_argument('--input-dropout', type=float, metavar='D',
+        parser.add_argument('--input-dropout', type=float, metavar='XXDXX',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')

Mutant 2503

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -88,7 +88,7 @@
         parser.add_argument('--relu-dropout', type=float, metavar='D',
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
-                            help='dropout probability of the inputs')
+                            help='XXdropout probability of the inputsXX')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',

Mutant 2504

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -89,7 +89,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('XX--encoder-embed-pathXX', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2505

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -89,7 +89,7 @@
                             help='dropout probability after ReLU in FFN')
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
-        parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('--encoder-embed-path', type=str, metavar='XXSTRXX',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2506

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -90,7 +90,7 @@
         parser.add_argument('--input-dropout', type=float, metavar='D',
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
-                            help='path to pre-trained encoder embedding')
+                            help='XXpath to pre-trained encoder embeddingXX')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',

Mutant 2507

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -91,7 +91,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
-        parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-embed-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2508

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -91,7 +91,7 @@
                             help='dropout probability of the inputs')
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
-        parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-embed-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')

Mutant 2509

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -92,7 +92,7 @@
         parser.add_argument('--encoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
-                            help='encoder embedding dimension')
+                            help='XXencoder embedding dimensionXX')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',

Mutant 2510

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -93,7 +93,7 @@
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-conv-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')

Mutant 2511

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -93,7 +93,7 @@
                             help='path to pre-trained encoder embedding')
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-conv-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')

Mutant 2512

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -94,7 +94,7 @@
         parser.add_argument('--encoder-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
-                            help='encoder embedding dimension')
+                            help='XXencoder embedding dimensionXX')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',

Mutant 2513

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -95,7 +95,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--encoder-ffn-embed-dimXX', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')

Mutant 2514

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -95,7 +95,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
-        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='XXNXX',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')

Mutant 2515

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -96,7 +96,7 @@
         parser.add_argument('--encoder-conv-dim', type=int, metavar='N',
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
-                            help='encoder embedding dimension for FFN')
+                            help='XXencoder embedding dimension for FFNXX')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',

Mutant 2516

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -97,7 +97,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
-        parser.add_argument('--encoder-layers', type=int, metavar='N',
+        parser.add_argument('XX--encoder-layersXX', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')

Mutant 2517

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -97,7 +97,7 @@
                             help='encoder embedding dimension')
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
-        parser.add_argument('--encoder-layers', type=int, metavar='N',
+        parser.add_argument('--encoder-layers', type=int, metavar='XXNXX',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')

Mutant 2518

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -98,7 +98,7 @@
         parser.add_argument('--encoder-ffn-embed-dim', type=int, metavar='N',
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
-                            help='num encoder layers')
+                            help='XXnum encoder layersXX')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',

Mutant 2519

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -99,7 +99,7 @@
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
-        parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('XX--encoder-attention-headsXX', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')

Mutant 2520

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -99,7 +99,7 @@
                             help='encoder embedding dimension for FFN')
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
-        parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('--encoder-attention-heads', type=int, metavar='XXNXX',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')

Mutant 2521

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -100,7 +100,7 @@
         parser.add_argument('--encoder-layers', type=int, metavar='N',
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
-                            help='num encoder attention heads or LightConv/DynamicConv heads')
+                            help='XXnum encoder attention heads or LightConv/DynamicConv headsXX')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',

Mutant 2522

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -101,7 +101,7 @@
                             help='num encoder layers')
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--encoder-normalize-before', action='store_true',
+        parser.add_argument('XX--encoder-normalize-beforeXX', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')

Mutant 2524

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -102,7 +102,7 @@
         parser.add_argument('--encoder-attention-heads', type=int, metavar='N',
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
-                            help='apply layernorm before each encoder block')
+                            help='XXapply layernorm before each encoder blockXX')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',

Mutant 2525

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -103,7 +103,7 @@
                             help='num encoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
-        parser.add_argument('--encoder-learned-pos', action='store_true',
+        parser.add_argument('XX--encoder-learned-posXX', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')

Mutant 2527

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -104,7 +104,7 @@
         parser.add_argument('--encoder-normalize-before', action='store_true',
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
-                            help='use learned positional embeddings in the encoder')
+                            help='XXuse learned positional embeddings in the encoderXX')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',

Mutant 2528

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -105,7 +105,7 @@
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
-        parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('XX--decoder-embed-pathXX', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2529

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -105,7 +105,7 @@
                             help='apply layernorm before each encoder block')
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
-        parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
+        parser.add_argument('--decoder-embed-path', type=str, metavar='XXSTRXX',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2530

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -106,7 +106,7 @@
         parser.add_argument('--encoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
-                            help='path to pre-trained decoder embedding')
+                            help='XXpath to pre-trained decoder embeddingXX')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',

Mutant 2531

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -107,7 +107,7 @@
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2532

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -107,7 +107,7 @@
                             help='use learned positional embeddings in the encoder')
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
-        parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')

Mutant 2533

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -108,7 +108,7 @@
         parser.add_argument('--decoder-embed-path', type=str, metavar='STR',
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension')
+                            help='XXdecoder embedding dimensionXX')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',

Mutant 2534

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -109,7 +109,7 @@
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-conv-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 2535

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -109,7 +109,7 @@
                             help='path to pre-trained decoder embedding')
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-conv-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')

Mutant 2536

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -110,7 +110,7 @@
         parser.add_argument('--decoder-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
-                            help='decoder embedding dimension')
+                            help='XXdecoder embedding dimensionXX')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',

Mutant 2537

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -111,7 +111,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('XX--decoder-ffn-embed-dimXX', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 2538

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -111,7 +111,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
-        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
+        parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='XXNXX',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')

Mutant 2539

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -112,7 +112,7 @@
         parser.add_argument('--decoder-conv-dim', type=int, metavar='N',
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
-                            help='decoder embedding dimension for FFN')
+                            help='XXdecoder embedding dimension for FFNXX')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',

Mutant 2540

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -113,7 +113,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('XX--decoder-layersXX', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 2541

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -113,7 +113,7 @@
                             help='decoder embedding dimension')
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
-        parser.add_argument('--decoder-layers', type=int, metavar='N',
+        parser.add_argument('--decoder-layers', type=int, metavar='XXNXX',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')

Mutant 2542

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -114,7 +114,7 @@
         parser.add_argument('--decoder-ffn-embed-dim', type=int, metavar='N',
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
-                            help='num decoder layers')
+                            help='XXnum decoder layersXX')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',

Mutant 2543

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -115,7 +115,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('XX--decoder-attention-headsXX', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')

Mutant 2544

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -115,7 +115,7 @@
                             help='decoder embedding dimension for FFN')
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
-        parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
+        parser.add_argument('--decoder-attention-heads', type=int, metavar='XXNXX',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')

Mutant 2545

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -116,7 +116,7 @@
         parser.add_argument('--decoder-layers', type=int, metavar='N',
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
-                            help='num decoder attention heads or LightConv/DynamicConv heads')
+                            help='XXnum decoder attention heads or LightConv/DynamicConv headsXX')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',

Mutant 2546

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -117,7 +117,7 @@
                             help='num decoder layers')
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
-        parser.add_argument('--decoder-learned-pos', action='store_true',
+        parser.add_argument('XX--decoder-learned-posXX', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')

Mutant 2548

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -118,7 +118,7 @@
         parser.add_argument('--decoder-attention-heads', type=int, metavar='N',
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
-                            help='use learned positional embeddings in the decoder')
+                            help='XXuse learned positional embeddings in the decoderXX')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',

Mutant 2549

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -119,7 +119,7 @@
                             help='num decoder attention heads or LightConv/DynamicConv heads')
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
-        parser.add_argument('--decoder-normalize-before', action='store_true',
+        parser.add_argument('XX--decoder-normalize-beforeXX', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')

Mutant 2551

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -120,7 +120,7 @@
         parser.add_argument('--decoder-learned-pos', action='store_true',
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
-                            help='apply layernorm before each decoder block')
+                            help='XXapply layernorm before each decoder blockXX')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',

Mutant 2552

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -121,7 +121,7 @@
                             help='use learned positional embeddings in the decoder')
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
-        parser.add_argument('--share-decoder-input-output-embed', action='store_true',
+        parser.add_argument('XX--share-decoder-input-output-embedXX', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'

Mutant 2554

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -122,7 +122,7 @@
         parser.add_argument('--decoder-normalize-before', action='store_true',
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
-                            help='share decoder input and output embeddings')
+                            help='XXshare decoder input and output embeddingsXX')
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')

Mutant 2555

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -123,7 +123,7 @@
                             help='apply layernorm before each decoder block')
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
-        parser.add_argument('--share-all-embeddings', action='store_true',
+        parser.add_argument('XX--share-all-embeddingsXX', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',

Mutant 2557

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -124,7 +124,7 @@
         parser.add_argument('--share-decoder-input-output-embed', action='store_true',
                             help='share decoder input and output embeddings')
         parser.add_argument('--share-all-embeddings', action='store_true',
-                            help='share encoder, decoder and output embeddings'
+                            help='XXshare encoder, decoder and output embeddingsXX'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '

Mutant 2558

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -126,7 +126,7 @@
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('XX--adaptive-softmax-cutoffXX', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 2559

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -126,7 +126,7 @@
         parser.add_argument('--share-all-embeddings', action='store_true',
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
-        parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
+        parser.add_argument('--adaptive-softmax-cutoff', metavar='XXEXPRXX',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',

Mutant 2560

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -127,7 +127,7 @@
                             help='share encoder, decoder and output embeddings'
                                  ' (requires shared dictionary and embed dim)')
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
-                            help='comma separated list of adaptive softmax cutoff points. '
+                            help='XXcomma separated list of adaptive softmax cutoff points. XX'
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')

Mutant 2561

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -129,7 +129,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('XX--adaptive-softmax-dropoutXX', type=float, metavar='D',
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""

Mutant 2562

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -129,7 +129,7 @@
         parser.add_argument('--adaptive-softmax-cutoff', metavar='EXPR',
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
-        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
+        parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='XXDXX',
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""

Mutant 2563

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -130,7 +130,7 @@
                             help='comma separated list of adaptive softmax cutoff points. '
                                  'Must be used with adaptive_loss criterion'),
         parser.add_argument('--adaptive-softmax-dropout', type=float, metavar='D',
-                            help='sets adaptive softmax dropout for the tail projections')
+                            help='XXsets adaptive softmax dropout for the tail projectionsXX')
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),

Mutant 2564

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -133,7 +133,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('XX--encoder-kernel-size-listXX', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')

Mutant 2565

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -133,7 +133,7 @@
                             help='sets adaptive softmax dropout for the tail projections')
 
         """LightConv and DynamicConv arguments"""
-        parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('--encoder-kernel-size-list', type=lambda x: None,
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')

Mutant 2566

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -134,7 +134,7 @@
 
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
-                            help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
+                            help='XXlist of kernel size (default: "[3,7,15,31,31,31,31]")XX')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,

Mutant 2567

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -135,7 +135,7 @@
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('XX--decoder-kernel-size-listXX', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2568

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -135,7 +135,7 @@
         """LightConv and DynamicConv arguments"""
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
-        parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
+        parser.add_argument('--decoder-kernel-size-list', type=lambda x: None,
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2569

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -136,7 +136,7 @@
         parser.add_argument('--encoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
-                            help='list of kernel size (default: "[3,7,15,31,31,31]")')
+                            help='XXlist of kernel size (default: "[3,7,15,31,31,31]")XX')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,

Mutant 2570

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -137,7 +137,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31,31]")')
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
-        parser.add_argument('--encoder-glu', type=options.eval_bool,
+        parser.add_argument('XX--encoder-gluXX', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')

Mutant 2571

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -138,7 +138,7 @@
         parser.add_argument('--decoder-kernel-size-list', type=lambda x: options.eval_str_list(x, int),
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
-                            help='glu after in proj')
+                            help='XXglu after in projXX')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,

Mutant 2572

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -139,7 +139,7 @@
                             help='list of kernel size (default: "[3,7,15,31,31,31]")')
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--decoder-glu', type=options.eval_bool,
+        parser.add_argument('XX--decoder-gluXX', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2573

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -140,7 +140,7 @@
         parser.add_argument('--encoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
-                            help='glu after in proj')
+                            help='XXglu after in projXX')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')

Mutant 2574

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -141,7 +141,7 @@
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('XX--encoder-conv-typeXX', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,

Mutant 2575

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -141,7 +141,7 @@
                             help='glu after in proj')
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
-        parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('--encoder-conv-type', default='XXdynamicXX', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,

Mutant 2576

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -142,7 +142,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['XXdynamicXX', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2577

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -142,7 +142,7 @@
         parser.add_argument('--decoder-glu', type=options.eval_bool,
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['dynamic', 'XXlightweightXX'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],

Mutant 2578

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -143,7 +143,7 @@
                             help='glu after in proj')
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
-                            help='type of convolution')
+                            help='XXtype of convolutionXX')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')

Mutant 2579

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -144,7 +144,7 @@
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('XX--decoder-conv-typeXX', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 2580

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -144,7 +144,7 @@
         parser.add_argument('--encoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
+        parser.add_argument('--decoder-conv-type', default='XXdynamicXX', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)

Mutant 2581

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -145,7 +145,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['XXdynamicXX', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 2582

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -145,7 +145,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
-                            choices=['dynamic', 'lightweight'],
+                            choices=['dynamic', 'XXlightweightXX'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',

Mutant 2583

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -146,7 +146,7 @@
                             help='type of convolution')
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
-                            help='type of convolution')
+                            help='XXtype of convolutionXX')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')

Mutant 2584

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -147,7 +147,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('XX--weight-softmaxXX', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 2585

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -147,7 +147,7 @@
         parser.add_argument('--decoder-conv-type', default='dynamic', type=str,
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
-        parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
+        parser.add_argument('--weight-softmax', default=False, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 

Mutant 2586

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -148,7 +148,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('XX--weight-dropoutXX', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 2587

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -148,7 +148,7 @@
                             choices=['dynamic', 'lightweight'],
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
-        parser.add_argument('--weight-dropout', type=float, metavar='D',
+        parser.add_argument('--weight-dropout', type=float, metavar='XXDXX',
                             help='dropout probability for conv weights')
 
     @classmethod

Mutant 2588

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -149,7 +149,7 @@
                             help='type of convolution')
         parser.add_argument('--weight-softmax', default=True, type=options.eval_bool)
         parser.add_argument('--weight-dropout', type=float, metavar='D',
-                            help='dropout probability for conv weights')
+                            help='XXdropout probability for conv weightsXX')
 
     @classmethod
     def build_model(cls, args, task):

Mutant 2589

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -151,7 +151,6 @@
         parser.add_argument('--weight-dropout', type=float, metavar='D',
                             help='dropout probability for conv weights')
 
-    @classmethod
     def build_model(cls, args, task):
         """Build a new model instance."""
 

Mutant 2590

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -316,7 +316,7 @@
             Default: ``False``
     """
 
-    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=True):
+    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=True, final_norm=True):
         super().__init__(dictionary)
         self.dropout_module = FairseqDropout(args.dropout, module_name=self.__class__.__name__)
         self.share_input_output_embed = args.share_decoder_input_output_embed

Mutant 2591

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -316,7 +316,7 @@
             Default: ``False``
     """
 
-    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=True):
+    def __init__(self, args, dictionary, embed_tokens, no_encoder_attn=False, final_norm=False):
         super().__init__(dictionary)
         self.dropout_module = FairseqDropout(args.dropout, module_name=self.__class__.__name__)
         self.share_input_output_embed = args.share_decoder_input_output_embed

Mutant 2592

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -462,7 +462,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, kernel_size=0):
+    def __init__(self, args, kernel_size=1):
         super().__init__()
         self.embed_dim = args.encoder_embed_dim
         self.conv_dim = args.encoder_conv_dim

Mutant 2593

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -530,7 +530,7 @@
         x = self.maybe_layer_norm(1, x, after=True)
         return x
 
-    def maybe_layer_norm(self, i, x, before=False, after=False):
+    def maybe_layer_norm(self, i, x, before=True, after=False):
         assert before ^ after
         if after ^ self.normalize_before:
             return self.layer_norms[i](x)

Mutant 2594

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -530,7 +530,7 @@
         x = self.maybe_layer_norm(1, x, after=True)
         return x
 
-    def maybe_layer_norm(self, i, x, before=False, after=False):
+    def maybe_layer_norm(self, i, x, before=False, after=True):
         assert before ^ after
         if after ^ self.normalize_before:
             return self.layer_norms[i](x)

Mutant 2595

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -552,7 +552,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, no_encoder_attn=False, kernel_size=0):
+    def __init__(self, args, no_encoder_attn=True, kernel_size=0):
         super().__init__()
         self.embed_dim = args.decoder_embed_dim
         self.conv_dim = args.decoder_conv_dim

Mutant 2596

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -552,7 +552,7 @@
         kernel_size: kernel size of the convolution
     """
 
-    def __init__(self, args, no_encoder_attn=False, kernel_size=0):
+    def __init__(self, args, no_encoder_attn=False, kernel_size=1):
         super().__init__()
         self.embed_dim = args.decoder_embed_dim
         self.conv_dim = args.decoder_conv_dim

Mutant 2597

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -660,7 +660,7 @@
         x = self.maybe_layer_norm(self.final_layer_norm, x, after=True)
         return x, attn
 
-    def maybe_layer_norm(self, layer_norm, x, before=False, after=False):
+    def maybe_layer_norm(self, layer_norm, x, before=True, after=False):
         assert before ^ after
         if after ^ self.normalize_before:
             return layer_norm(x)

Mutant 2598

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -660,7 +660,7 @@
         x = self.maybe_layer_norm(self.final_layer_norm, x, after=True)
         return x, attn
 
-    def maybe_layer_norm(self, layer_norm, x, before=False, after=False):
+    def maybe_layer_norm(self, layer_norm, x, before=False, after=True):
         assert before ^ after
         if after ^ self.normalize_before:
             return layer_norm(x)

Mutant 2599

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -667,7 +667,7 @@
         else:
             return x
 
-    def make_generation_fast_(self, need_attn=False, **kwargs):
+    def make_generation_fast_(self, need_attn=True, **kwargs):
         self.need_attn = need_attn
 
     def extra_repr(self):

Mutant 2600

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -682,7 +682,7 @@
     return m
 
 
-def Linear(in_features, out_features, bias=True):
+def Linear(in_features, out_features, bias=False):
     m = nn.Linear(in_features, out_features, bias)
     nn.init.xavier_uniform_(m.weight)
     if bias:

Mutant 2602

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -690,7 +690,7 @@
     return m
 
 
-@register_model_architecture('lightconv', 'lightconv')
+@register_model_architecture('lightconv', 'XXlightconvXX')
 def base_architecture(args):
     args.encoder_embed_path = getattr(args, 'encoder_embed_path', None)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)

Mutant 2603

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -689,8 +689,6 @@
         nn.init.constant_(m.bias, 0.)
     return m
 
-
-@register_model_architecture('lightconv', 'lightconv')
 def base_architecture(args):
     args.encoder_embed_path = getattr(args, 'encoder_embed_path', None)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)

Mutant 2605

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -735,7 +735,7 @@
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
 
-@register_model_architecture('lightconv', 'lightconv_iwslt_de_en')
+@register_model_architecture('lightconv', 'XXlightconv_iwslt_de_enXX')
 def lightconv_iwslt_de_en(args):
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)
     args.encoder_ffn_embed_dim = getattr(args, 'encoder_ffn_embed_dim', 1024)

Mutant 2606

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -734,8 +734,6 @@
     args.input_dropout = getattr(args, 'input_dropout', 0.1)
     args.weight_dropout = getattr(args, 'weight_dropout', args.attention_dropout)
 
-
-@register_model_architecture('lightconv', 'lightconv_iwslt_de_en')
 def lightconv_iwslt_de_en(args):
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 512)
     args.encoder_ffn_embed_dim = getattr(args, 'encoder_ffn_embed_dim', 1024)

Mutant 2608

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -753,7 +753,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_deXX')
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 

Mutant 2609

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -752,8 +752,6 @@
     args.input_dropout = getattr(args, 'input_dropout', 0.0)
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de')
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 

Mutant 2611

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -758,7 +758,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_de_bigXX')
 def lightconv_wmt_en_de_big(args):
     args.attention_dropout = getattr(args, 'attention_dropout', 0.1)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 1024)

Mutant 2612

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -757,8 +757,6 @@
 def lightconv_wmt_en_de(args):
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_de_big')
 def lightconv_wmt_en_de_big(args):
     args.attention_dropout = getattr(args, 'attention_dropout', 0.1)
     args.encoder_embed_dim = getattr(args, 'encoder_embed_dim', 1024)

Mutant 2614

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -772,7 +772,7 @@
     base_architecture(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_en_fr_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_en_fr_bigXX')
 def lightconv_wmt_en_fr_big(args):
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)

Mutant 2615

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -771,8 +771,6 @@
     args.dropout = getattr(args, 'dropout', 0.3)
     base_architecture(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_en_fr_big')
 def lightconv_wmt_en_fr_big(args):
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)

Mutant 2617

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -778,7 +778,7 @@
     lightconv_wmt_en_de_big(args)
 
 
-@register_model_architecture('lightconv', 'lightconv_wmt_zh_en_big')
+@register_model_architecture('lightconv', 'XXlightconv_wmt_zh_en_bigXX')
 def lightconv_wmt_zh_en_big(args):
     args.dropout = getattr(args, 'dropout', 0.2)
     args.attention_dropout = getattr(args, 'attention_dropout', 0.2)

Mutant 2618

--- fairseq/models/lightconv.py
+++ fairseq/models/lightconv.py
@@ -777,8 +777,6 @@
     args.dropout = getattr(args, 'dropout', 0.1)
     lightconv_wmt_en_de_big(args)
 
-
-@register_model_architecture('lightconv', 'lightconv_wmt_zh_en_big')
 def lightconv_wmt_zh_en_big(args):
     args.dropout = getattr(args, 'dropout', 0.2)
     args.attention_dropout = getattr(args, 'attention_dropout', 0.2)