diff --git a/dataset/preprocessing/data_processor.py b/dataset/preprocessing/data_processor.py index 266ac2d..8a2c388 100644 --- a/dataset/preprocessing/data_processor.py +++ b/dataset/preprocessing/data_processor.py @@ -83,9 +83,9 @@ def __init__(self, outer_instance): transformations_per_example=random.randint(1, 3) ) - self.augmenter_insert = Augmenter( + self.insert_augmenter = Augmenter( transformation=WordSwapRandomCharacterInsertion(), - pct_words_to_swap=0.5, + pct_words_to_swap=0.4, transformations_per_example=random.randint(1, 3) ) @@ -125,7 +125,7 @@ def augment(self): # Esto es de textattack, creo que será buena idea... veamos. swapped_names = self.swap_augmenter.augment(name) - insertions_names = self.augmenter_insert.augment(name) + insertions_names = self.insert_augmenter.augment(name) for aug_name in swapped_names + insertions_names: augmented_data.append(f"{label} {aug_name}")