Test / src /scripts /1_dump_texts.py
Архипов Дмитрий
test
565e754
import os
import sys
sys.path.append(os.getcwd())
import pandas as pd
from src.db_utils.sql_utils import sql_drop, sql_dump_df
from src.data.clean import clean_df
if __name__ == "__main__":
    # Document preprocessing: read the RBC news posts CSV and pass the
    # resulting frame through the project's clean_df helper.
    cleaned_posts = clean_df(
        pd.read_csv("src/dataset/rbc/channel_rbc_news_posts.csv")
    )

    # Load into the database: sql_drop is called on the target table first,
    # then the cleaned frame is dumped into it with if_exists="replace".
    target_table = "posts"
    sql_drop(target_table)
    sql_dump_df(cleaned_posts, target_table, if_exists="replace")