Spaces:
Running
Running
File size: 590 Bytes
d29b763 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 | from pathlib import Path
from preprocessing.artifact_manager import manager
# Third ancestor of this file's resolved absolute path: parents[0] is the
# containing directory, so parents[2] sits two directories above it.
# NOTE(review): presumably the repository root -- confirm against the layout.
BASE_DIR = Path(__file__).resolve().parents[2]

# Destination file for the combined DDInter table, stored under
# <BASE_DIR>/data/processed/.
OUTPUT_PATH = BASE_DIR.joinpath('data', 'processed', 'ddinter_combined.parquet')
def main() -> None:
    """Load the ``ddinter_combined`` artifact, preview it, and save it as Parquet.

    The artifact is fetched through ``manager.load_artifact``; a one-line
    size summary and the result of ``head()`` are printed, and the table is
    then written to ``OUTPUT_PATH`` with ``index=False``.

    NOTE(review): the loaded object is presumably a pandas DataFrame (it is
    used via ``len``, ``.columns``, ``.head()`` and ``.to_parquet``) --
    confirm against ``preprocessing.artifact_manager``.
    """
    df = manager.load_artifact('ddinter_combined')

    # Report the size of what was loaded, followed by a short preview.
    summary = f'Loaded processed DDInter artifact: {len(df)} rows, {len(df.columns)} columns'
    print(summary)
    preview = df.head()
    print(preview)

    # Create the destination directory (and any missing ancestors) before
    # writing; exist_ok=True makes this a no-op when it already exists.
    destination_dir = OUTPUT_PATH.parent
    destination_dir.mkdir(parents=True, exist_ok=True)

    df.to_parquet(OUTPUT_PATH, index=False)
    print(f'Saved processed DDInter artifact to {OUTPUT_PATH}')
# Run the export only when this file is executed as a script, not when it is
# imported as a module.
if __name__ == '__main__':
    main()