ramayan_rag / main.py
anshumanpatil's picture
RAG references changed
e8586c9
import os
# Marker text for section headings: main() treats every input line that
# contains this text (note the trailing space) as a "Canto" heading and
# splits the source text at it.
substring = "Canto "
def main(source_path="ramayan.txt", output_dir="ramayan", marker=None):
    """Split a text file into one output file per heading-delimited section.

    Every input line is stripped of surrounding whitespace. A line that
    contains ``marker`` starts a new section; all following lines up to the
    next heading belong to that section. Each section is written to
    ``<output_dir>/ramayan_cleaned_<n>.txt`` (``n`` counts from 0 in order of
    appearance) as the heading, a blank line, and then the section's lines
    joined by newlines.

    Text that appears before the first heading is written as its own file
    without a heading, unless it contains only blank lines, in which case it
    is skipped. The last section of the input is written as well.

    Args:
        source_path: Path of the UTF-8 text file to split.
        output_dir: Directory that receives the output files. It is created
            if it does not exist yet.
        marker: Text that identifies a heading line. Defaults to the
            module-level ``substring`` constant.

    Raises:
        OSError: If the source file cannot be read or an output file or the
            output directory cannot be created.
    """
    if marker is None:
        marker = substring

    # Collect (heading, lines) pairs first so that every heading ends up in
    # the same file as the text that follows it.
    sections = []
    heading = None  # None marks the text that precedes the first heading
    body = []

    with open(source_path, "r", encoding="utf8") as source:
        for line in source:
            sentence = line.strip()
            if marker in sentence:
                print(sentence, "\n")
                sections.append((heading, body))
                heading, body = sentence, []
            else:
                body.append(sentence)

    # The section that was still open at end of input has not been stored yet.
    sections.append((heading, body))

    # Drop a heading-less leading section that holds nothing but blank lines;
    # sections that do have a heading are kept even when their body is empty.
    pages = [
        (title, lines)
        for title, lines in sections
        if title is not None or any(lines)
    ]
    if not pages:
        return

    os.makedirs(output_dir, exist_ok=True)
    for page_no, (title, lines) in enumerate(pages):
        target = os.path.join(output_dir, f"ramayan_cleaned_{page_no}.txt")
        with open(target, "w", encoding="utf8") as out:
            if title is not None:
                out.write(f"{title}\n\n")
            out.write("\n".join(lines))
# Script entry point: run the splitter only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    main()