| | import pandas as pd |
| | import os |
| |
|
| | def load_data(data_dir): |
| | """ |
| | Loads train and test data from the specified directory. |
| | |
| | Args: |
| | data_dir (str): Path to the directory containing 'train.csv' and 'test.csv'. |
| | |
| | Returns: |
| | tuple: (train_df, test_df) |
| | """ |
| | train_path = os.path.join(data_dir, 'train.csv') |
| | test_path = os.path.join(data_dir, 'test.csv') |
| | |
| | if not os.path.exists(train_path): |
| | raise FileNotFoundError(f"Train file not found at {train_path}") |
| | if not os.path.exists(test_path): |
| | raise FileNotFoundError(f"Test file not found at {test_path}") |
| | |
| | print("Loading training data...") |
| | train_df = pd.read_csv(train_path, parse_dates=['Dates']) |
| | print(f"Training data loaded: {train_df.shape}") |
| | |
| | print("Loading test data...") |
| | test_df = pd.read_csv(test_path, parse_dates=['Dates']) |
| | print(f"Test data loaded: {test_df.shape}") |
| | |
| | return train_df, test_df |
| |
|
| | if __name__ == "__main__": |
| | |
| | data_dir = os.path.join(os.path.dirname(__file__), '../data/crimedataset') |
| | try: |
| | train, test = load_data(data_dir) |
| | print(train.head()) |
| | except Exception as e: |
| | print(e) |
| |
|