from argparse import ArgumentParser | |
from typing import List | |
def get_args(): | |
""" | |
Parses command-line arguments for ALIGN-Multilingual. | |
Returns: | |
argparse.Namespace: Parsed arguments. | |
""" | |
parser = ArgumentParser(description="ALIGN-SentencePerturbation Argument Parser") | |
parser.add_argument( | |
"--dataset_name", | |
dest="dataset_name", | |
type=str, | |
default="mrpc", | |
choices=["mrpc", "qqp","paws"], | |
help="Name of the dataset to use.", | |
) | |
parser.add_argument( | |
"--task", | |
dest="task", | |
type=str, | |
default="syn", | |
choices=["syn", "anto","jumb","jumbling","paraphrase","para"], | |
help="Perturbation task to perform.", | |
) | |
parser.add_argument( | |
"--target_lang", | |
dest="target_lang", | |
type=str, | |
default="en", | |
help="Target language for translation.", | |
) | |
parser.add_argument( | |
"--output_dir", | |
dest="output_dir", | |
type=str, | |
default="./data/perturbed_dataset/", | |
help="Output directory for perturbed dataset.", | |
) | |
parser.add_argument( | |
"--save", | |
dest="save", | |
type=bool, | |
help="Whether to save the translated dataset to a file.", | |
) | |
parser.add_argument( | |
"--sample_size", | |
dest="sample_size", | |
type=int, | |
default=None, | |
help="Number of rows to process.", | |
) | |
return parser.parse_args() |