File size: 590 Bytes
d29b763
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
from pathlib import Path

from preprocessing.artifact_manager import manager

# Directory two levels above the folder that contains this file
# (presumably the project root -- confirm against the repository layout).
BASE_DIR = Path(__file__).resolve().parents[2]
# Destination of the parquet export written by main().
OUTPUT_PATH = BASE_DIR.joinpath('data', 'processed', 'ddinter_combined.parquet')


def main() -> None:
    """Export the combined DDInter artifact to a parquet file.

    Loads the artifact registered as ``'ddinter_combined'`` through the
    artifact manager, prints its row/column counts and a preview of its
    first rows, then writes it to ``OUTPUT_PATH`` without the index,
    creating the destination directory first if it does not exist.

    The loaded object is used as a DataFrame-like table (``columns``,
    ``head()``, ``to_parquet()``) -- presumably a pandas DataFrame.
    """
    frame = manager.load_artifact('ddinter_combined')

    # Summarise what was loaded before writing anything to disk.
    n_rows = len(frame)
    n_cols = len(frame.columns)
    print(f'Loaded processed DDInter artifact: {n_rows} rows, {n_cols} columns')
    print(frame.head())

    # Ensure the destination directory exists; an existing one is fine.
    target_dir = OUTPUT_PATH.parent
    target_dir.mkdir(parents=True, exist_ok=True)

    frame.to_parquet(OUTPUT_PATH, index=False)
    print(f'Saved processed DDInter artifact to {OUTPUT_PATH}')

# Run the export only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()