Spaces:
Running
Running
from datasets import load_dataset | |
import shutil | |
import os | |
# Define the directory where the dataset should be saved | |
lan = "eng" | |
download_dir = os.path.join("../env/data", lan) | |
# Create the directory if it does not exist, or remove it if it already exists | |
if os.path.exists(download_dir): | |
shutil.rmtree(download_dir) | |
os.makedirs(download_dir) | |
# Load the dataset with the specified splits | |
dataset = load_dataset("SemRel/SemRel2024", lan, split=['train', 'dev', 'test']) | |
# Save each split to a CSV file in the specified directory | |
for split_name, split_data in zip(['train', 'dev', 'test'], dataset): | |
split_data.to_csv(f"{download_dir}/{lan}_{split_name}.csv", index=False) | |
# Print a message indicating where the dataset has been saved and display the splits | |
print(f"Dataset downloaded and saved to {download_dir}") | |
for split_name in ['train', 'dev', 'test']: | |
print(f"{lan}_{split_name} split saved to {download_dir}/{lan}_{split_name}.csv") | |