File size: 1,316 Bytes
d187b57 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 |
import pandas as pd
def check_dataset():
try:
# Check train dataset
print("\nChecking train dataset...")
train_df = pd.read_csv("dataset/split/train.csv")
print("\nTrain Dataset Columns:")
print("-" * 50)
for col in train_df.columns:
print(f"- {col}")
print(f"\nTrain Dataset Shape: {train_df.shape}")
print("\nTrain Dataset Info:")
print(train_df.info())
print("\nFirst few rows of train dataset:")
print(train_df.head())
# Check validation dataset
print("\nChecking validation dataset...")
val_df = pd.read_csv("dataset/split/val.csv")
print("\nValidation Dataset Columns:")
print("-" * 50)
for col in val_df.columns:
print(f"- {col}")
print(f"\nValidation Dataset Shape: {val_df.shape}")
# Check test dataset
print("\nChecking test dataset...")
test_df = pd.read_csv("dataset/split/test.csv")
print("\nTest Dataset Columns:")
print("-" * 50)
for col in test_df.columns:
print(f"- {col}")
print(f"\nTest Dataset Shape: {test_df.shape}")
except Exception as e:
print(f"Error: {str(e)}")
if __name__ == "__main__":
check_dataset() |