TunisianEncodersArena / scripts /explore_arabml.py
hamzabouajila's picture
Implement scripts for checking, add logging, update submission, and integrate evaluation
742dfc3
raw
history blame contribute delete
557 Bytes
from datasets import load_dataset
def explore_arabml():
    """Print a quick overview of the Tunisian Dialect Corpus test split.

    Loads the ``test`` split of ``arbml/Tunisian_Dialect_Corpus`` through
    ``load_dataset`` and prints, in order: the dataset's ``info`` attribute,
    the item at index 0, the ``column_names`` attribute, and the slice
    ``[:3]``. Each value is preceded by a heading line. Returns nothing.
    """
    corpus = load_dataset("arbml/Tunisian_Dialect_Corpus", split="test")

    # Each section pairs a heading with a lazy accessor, so a value is only
    # read right before it is printed, one section at a time.
    sections = (
        ("\nDataset Info:", lambda ds: ds.info),
        ("\nFirst Example:", lambda ds: ds[0]),
        ("\nColumn Names:", lambda ds: ds.column_names),
        ("\nFirst few rows:", lambda ds: ds[:3]),
    )
    for heading, read in sections:
        print(heading)
        print(read(corpus))
# Script entry point: run the exploration only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    explore_arabml()