File size: 625 Bytes
f29d474
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
from data_loader import load_mk_dataset

def test_dataset():
    print("Testing Macedonian dataset loader...")
    
    # Load the dataset
    dataset = load_mk_dataset()
    
    # Print basic statistics
    print(f"\nDataset size: {len(dataset)} examples")
    
    # Show first few examples
    print("\nFirst 3 examples:")
    for i in range(min(3, len(dataset))):
        text = dataset[i]['text']
        print(f"\nExample {i+1}:")
        print(f"Length: {len(text)} characters")
        print(f"Preview: {text[:200]}...")  # Show first 200 characters

if __name__ == "__main__":
    test_dataset()