File size: 463 Bytes
565e754 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 |
import os
import sys
sys.path.append(os.getcwd())
import pandas as pd
from src.db_utils.sql_utils import sql_drop, sql_dump_df
from src.data.clean import clean_df
if __name__ == "__main__":
    # Script entry point: read the posts CSV, clean it, and store the result
    # in the database. The CSV path is relative, so it is resolved against
    # the current working directory.
    source_csv = "src/dataset/rbc/channel_rbc_news_posts.csv"
    target_table = "posts"

    # Document preprocessing: load the raw CSV and pass it through clean_df.
    cleaned_posts = clean_df(pd.read_csv(source_csv))

    # Load into the database: sql_drop is called on the table name first,
    # then the cleaned frame is handed to sql_dump_df with
    # if_exists="replace".
    # NOTE(review): presumably sql_dump_df forwards if_exists to
    # DataFrame.to_sql, which would make the explicit drop redundant --
    # confirm against src.db_utils.sql_utils before removing either call.
    sql_drop(target_table)
    sql_dump_df(cleaned_posts, target_table, if_exists="replace")
|