# AB_Testing_RAG_Agent / simple_package.py
# Commit ece2d3a by kamkol: Add simplified data packaging functionality
import os
import tarfile
from pathlib import Path
# Define paths
# Both paths are relative, so they resolve against the current working
# directory at the time the script runs.
# Directory that gets archived (added to the tarball under its own name).
PROCESSED_DATA_DIR = Path("processed_data")
# File name of the gzip-compressed tar archive that is written.
TARGET_PACKAGE = "processed_data.tar.gz"
def simple_package(source_dir=None, target=None):
    """
    Package the processed data into a single compressed file without validation.

    This creates a tar.gz file containing the entire source directory, stored
    in the archive under the directory's own base name.

    The archive is first written to a temporary sibling file and only renamed
    onto ``target`` once it is complete, so a failed run never leaves a
    truncated package behind and never destroys a previously built one.

    Args:
        source_dir: Directory to package. Defaults to ``PROCESSED_DATA_DIR``.
        target: Path of the archive to create. Defaults to ``TARGET_PACKAGE``.

    Returns:
        True if the package was created, False if the source directory is
        missing (or is not a directory) or the archive could not be written.
    """
    # Resolve defaults lazily so callers can override either path.
    source_dir = Path(PROCESSED_DATA_DIR if source_dir is None else source_dir)
    target = Path(TARGET_PACKAGE if target is None else target)

    print("Starting simple packaging process...")

    # A plain file with the right name is not something we can package.
    if not source_dir.is_dir():
        print(f"ERROR: Directory {source_dir} not found!")
        return False

    print(f"Creating package file: {target}")

    # Build the archive next to the target so the final rename stays on the
    # same filesystem.
    partial = target.with_name(target.name + ".tmp")
    try:
        with tarfile.open(partial, "w:gz") as tar:
            # Add the entire directory
            tar.add(source_dir, arcname=source_dir.name)
        partial.replace(target)
    except (OSError, tarfile.TarError) as exc:
        print(f"Failed to create package file: {exc}")
        # Remove the incomplete archive, if one was started.
        if partial.exists():
            partial.unlink()
        return False

    size_mb = target.stat().st_size / (1024 * 1024)
    print(f"Package created successfully: {target} ({size_mb:.2f} MB)")
    print("\nInstructions:")
    print(f"1. Upload {target} to your Hugging Face Space")
    print("2. The app will automatically extract it on startup")
    return True
# Run the packaging step only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    simple_package()