fairseq/tasks/legacy_masked_lm.py
Killed 1 out of 27 mutants
Survived
Survived mutation testing. These mutants show holes in your test suite.
Mutant 3297
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -24,7 +24,7 @@
from fairseq import utils
-logger = logging.getLogger(__name__)
+logger = None
@register_task('legacy_masked_lm')
Mutant 3298
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -27,7 +27,7 @@
logger = logging.getLogger(__name__)
-@register_task('legacy_masked_lm')
+@register_task('XXlegacy_masked_lmXX')
class LegacyMaskedLMTask(FairseqTask):
"""
Task for training Masked LM (BERT) model.
Mutant 3299
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -26,8 +26,6 @@
logger = logging.getLogger(__name__)
-
-@register_task('legacy_masked_lm')
class LegacyMaskedLMTask(FairseqTask):
"""
Task for training Masked LM (BERT) model.
Mutant 3300
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -35,7 +35,6 @@
dictionary (Dictionary): the dictionary for the input of the task
"""
- @staticmethod
def add_args(parser):
"""Add task-specific arguments to the parser."""
parser.add_argument('data', help='colon separated path to data directories list, \
Mutant 3301
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -38,7 +38,7 @@
@staticmethod
def add_args(parser):
"""Add task-specific arguments to the parser."""
- parser.add_argument('data', help='colon separated path to data directories list, \
+ parser.add_argument('XXdataXX', help='colon separated path to data directories list, \
will be iterated upon during epochs in round-robin manner')
parser.add_argument('--tokens-per-sample', default=512, type=int,
help='max number of total tokens over all segments'
Mutant 3302
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -38,8 +38,8 @@
@staticmethod
def add_args(parser):
"""Add task-specific arguments to the parser."""
- parser.add_argument('data', help='colon separated path to data directories list, \
- will be iterated upon during epochs in round-robin manner')
+ parser.add_argument('data', help='XXcolon separated path to data directories list, \
+ will be iterated upon during epochs in round-robin mannerXX')
parser.add_argument('--tokens-per-sample', default=512, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
Mutant 3303
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -40,7 +40,7 @@
"""Add task-specific arguments to the parser."""
parser.add_argument('data', help='colon separated path to data directories list, \
will be iterated upon during epochs in round-robin manner')
- parser.add_argument('--tokens-per-sample', default=512, type=int,
+ parser.add_argument('XX--tokens-per-sampleXX', default=512, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
Mutant 3304
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -40,7 +40,7 @@
"""Add task-specific arguments to the parser."""
parser.add_argument('data', help='colon separated path to data directories list, \
will be iterated upon during epochs in round-robin manner')
- parser.add_argument('--tokens-per-sample', default=512, type=int,
+ parser.add_argument('--tokens-per-sample', default=513, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
Mutant 3305
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -41,7 +41,7 @@
parser.add_argument('data', help='colon separated path to data directories list, \
will be iterated upon during epochs in round-robin manner')
parser.add_argument('--tokens-per-sample', default=512, type=int,
- help='max number of total tokens over all segments'
+ help='XXmax number of total tokens over all segmentsXX'
' per sample for BERT dataset')
parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
parser.add_argument('--shuffle-dataset', action='store_true', default=False)
Mutant 3306
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -43,7 +43,7 @@
parser.add_argument('--tokens-per-sample', default=512, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
- parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
+ parser.add_argument('XX--break-modeXX', default="doc", type=str, help='mode for breaking sentence')
parser.add_argument('--shuffle-dataset', action='store_true', default=False)
def __init__(self, args, dictionary):
Mutant 3307
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -43,7 +43,7 @@
parser.add_argument('--tokens-per-sample', default=512, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
- parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
+ parser.add_argument('--break-mode', default="XXdocXX", type=str, help='mode for breaking sentence')
parser.add_argument('--shuffle-dataset', action='store_true', default=False)
def __init__(self, args, dictionary):
Mutant 3308
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -43,7 +43,7 @@
parser.add_argument('--tokens-per-sample', default=512, type=int,
help='max number of total tokens over all segments'
' per sample for BERT dataset')
- parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
+ parser.add_argument('--break-mode', default="doc", type=str, help='XXmode for breaking sentenceXX')
parser.add_argument('--shuffle-dataset', action='store_true', default=False)
def __init__(self, args, dictionary):
Mutant 3309
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -44,7 +44,7 @@
help='max number of total tokens over all segments'
' per sample for BERT dataset')
parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
- parser.add_argument('--shuffle-dataset', action='store_true', default=False)
+ parser.add_argument('XX--shuffle-datasetXX', action='store_true', default=False)
def __init__(self, args, dictionary):
super().__init__(args)
Mutant 3311
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -44,7 +44,7 @@
help='max number of total tokens over all segments'
' per sample for BERT dataset')
parser.add_argument('--break-mode', default="doc", type=str, help='mode for breaking sentence')
- parser.add_argument('--shuffle-dataset', action='store_true', default=False)
+ parser.add_argument('--shuffle-dataset', action='store_true', default=True)
def __init__(self, args, dictionary):
super().__init__(args)
Mutant 3312
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -51,7 +51,6 @@
self.dictionary = dictionary
self.seed = args.seed
- @classmethod
def load_dictionary(cls, filename):
return BertDictionary.load(filename)
Mutant 3313
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -55,7 +55,6 @@
def load_dictionary(cls, filename):
return BertDictionary.load(filename)
- @classmethod
def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Mutant 3314
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=2, threshold=-1, nwords=-1, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3315
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=1, threshold=+1, nwords=-1, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3316
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=1, threshold=-2, nwords=-1, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3317
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=+1, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3318
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-2, padding_factor=8):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3319
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -56,7 +56,7 @@
return BertDictionary.load(filename)
@classmethod
- def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=8):
+ def build_dictionary(cls, filenames, workers=1, threshold=-1, nwords=-1, padding_factor=9):
d = BertDictionary()
for filename in filenames:
Dictionary.add_file_to_dictionary(filename, d, tokenizer.tokenize_line, workers)
Mutant 3320
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -63,7 +63,6 @@
d.finalize(threshold=threshold, nwords=nwords, padding_factor=padding_factor)
return d
- @property
def target_dictionary(self):
return self.dictionary
Mutant 3321
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -67,7 +67,6 @@
def target_dictionary(self):
return self.dictionary
- @classmethod
def setup_task(cls, args, **kwargs):
"""Setup the task.
"""
Mutant 3322
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -78,7 +78,7 @@
return cls(args, dictionary)
- def load_dataset(self, split, epoch=1, combine=False):
+ def load_dataset(self, split, epoch=2, combine=False):
"""Load a given dataset split.
Args:
Mutant 3323
--- fairseq/tasks/legacy_masked_lm.py
+++ fairseq/tasks/legacy_masked_lm.py
@@ -78,7 +78,7 @@
return cls(args, dictionary)
- def load_dataset(self, split, epoch=1, combine=False):
+ def load_dataset(self, split, epoch=1, combine=True):
"""Load a given dataset split.
Args: