FinGraph / scripts /delete_zero_rel_articles.py
dev-yuje's picture
refactor: clean up root directory by removing cache, old data, and moving scripts
080ff86
# -*- coding: utf-8 -*-
"""
FinGraph ์ง€์‹ ๊ทธ๋ž˜ํ”„ ๋ฌด๊ฒฐ์„ฑ ๊ด€๋ฆฌ ์œ ํ‹ธ๋ฆฌํ‹ฐ
- ์ €์ž‘๊ถŒ: (c) 2026 yujetak / FinGraph Contributors (MIT License)
- ์—ญํ• : ์ง์ ‘์ ์ธ ์—”ํ‹ฐํ‹ฐ ๊ฐ„ ๊ด€๊ณ„์„ (DEVELOPS, APPLIES ๋“ฑ)์ด 0๊ฐœ์ธ ๊ณ ๋ฆฝ ๊ธฐ์‚ฌ ๋…ธ๋“œ๋ฅผ ํƒ์ƒ‰ํ•˜๊ณ  ์ œ๊ฑฐํ•˜์—ฌ
๊ทธ๋ž˜ํ”„์˜ ์—ฐ๊ฒฐ ๋ฐ€๋„์™€ RAG ๊ฒ€์ƒ‰ ๋ฌด๊ฒฐ์„ฑ์„ ๋†’์ž…๋‹ˆ๋‹ค.
"""
import os
import dotenv
import neo4j
dotenv.load_dotenv()
def get_neo4j_driver() -> neo4j.Driver:
uri = os.getenv("NEO4J_URI", "neo4j://localhost:7687")
client_id = os.getenv("NEO4J_CLIENT_ID")
client_secret = os.getenv("NEO4J_CLIENT_SECRET")
if client_id and client_secret:
try:
d = neo4j.GraphDatabase.driver(uri, auth=(client_id, client_secret))
d.verify_connectivity()
return d
except Exception:
pass
username = os.getenv("NEO4J_USERNAME", "neo4j")
password = os.getenv("NEO4J_PASSWORD", "password")
d = neo4j.GraphDatabase.driver(uri, auth=(username, password))
d.verify_connectivity()
return d
if __name__ == "__main__":
driver = get_neo4j_driver()
with driver.session() as s:
res = s.run('''
MATCH (a:Article)
OPTIONAL MATCH (a)-[:MENTIONS]->(n)
OPTIONAL MATCH (n)-[r:DEVELOPS|INVESTS_IN|PARTNERS_WITH|APPLIES|USED_IN|RELATED_TO]-()
WITH a, count(r) as rel_cnt
WHERE rel_cnt = 0
DETACH DELETE a
RETURN count(a) as deleted_count
''')
record = res.single()
if record:
print(f'Deleted articles with 0 relations: {record["deleted_count"]}')
driver.close()