Add docker-compose, multi-stage builds, and developer tooling
Browse files
- scripts/eda.py +2 -2
scripts/eda.py
CHANGED
|
@@ -5,6 +5,8 @@
|
|
| 5 |
# data distributions, quality issues, and inform modeling decisions.
|
| 6 |
|
| 7 |
# %% Imports
|
|
|
|
|
|
|
| 8 |
import pandas as pd
|
| 9 |
import matplotlib.pyplot as plt
|
| 10 |
|
|
@@ -315,8 +317,6 @@ print(f"Data quality issues: {empty_reviews + very_short + duplicate_texts}")
|
|
| 315 |
print(f"\nPlots saved to: {FIGURES_DIR}")
|
| 316 |
|
| 317 |
# %% Generate markdown report
|
| 318 |
-
from pathlib import Path
|
| 319 |
-
|
| 320 |
REPORTS_DIR = Path("reports")
|
| 321 |
REPORTS_DIR.mkdir(exist_ok=True)
|
| 322 |
|
|
|
|
| 5 |
# data distributions, quality issues, and inform modeling decisions.
|
| 6 |
|
| 7 |
# %% Imports
|
| 8 |
+
from pathlib import Path
|
| 9 |
+
|
| 10 |
import pandas as pd
|
| 11 |
import matplotlib.pyplot as plt
|
| 12 |
|
|
|
|
| 317 |
print(f"\nPlots saved to: {FIGURES_DIR}")
|
| 318 |
|
| 319 |
# %% Generate markdown report
|
|
|
|
|
|
|
| 320 |
REPORTS_DIR = Path("reports")
|
| 321 |
REPORTS_DIR.mkdir(exist_ok=True)
|
| 322 |
|