osellight committed on
Commit
815ab21
·
1 Parent(s): 6deb76a

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -10
app.py CHANGED
@@ -3,17 +3,17 @@ from langchain.vectorstores import Chroma
3
  from langchain.text_splitter import CharacterTextSplitter
4
  from langchain.chains.question_answering import load_qa_chain
5
  from langchain.llms import OpenAI
6
- from dotenv import load_dotenv
7
  import os
8
  import subprocess
9
 
10
  # Load environment variables from .env file
11
- load_dotenv()
12
- # Access environment variables
13
- OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
14
- SERPAPI_API_KEY = os.getenv("SERPAPI_API_KEY")
15
 
16
- # subprocess.run(["git", "clone", "https://github.com/TheMITTech/shakespeare"], check=True)
17
 
18
  from glob import glob
19
  files = glob("./shakespeare/**/*.html")
@@ -21,10 +21,10 @@ files = glob("./shakespeare/**/*.html")
21
 
22
  import shutil
23
  import os
24
- # os.mkdir('./data')
25
- # destination_folder = './data/'
26
- # for html_file in files:
27
- # shutil.move(html_file, destination_folder + html_file.split("/")[-1])
28
 
29
 
30
  from langchain.document_loaders import BSHTMLLoader, DirectoryLoader
 
3
  from langchain.text_splitter import CharacterTextSplitter
4
  from langchain.chains.question_answering import load_qa_chain
5
  from langchain.llms import OpenAI
6
+ # from dotenv import load_dotenv
7
  import os
8
  import subprocess
9
 
10
  # Load environment variables from .env file
11
+ # load_dotenv()
12
+ # # Access environment variables
13
+ # OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
14
+ # SERPAPI_API_KEY = os.getenv("SERPAPI_API_KEY")
15
 
16
+ subprocess.run(["git", "clone", "https://github.com/TheMITTech/shakespeare"], check=True)
17
 
18
  from glob import glob
19
  files = glob("./shakespeare/**/*.html")
 
21
 
22
  import shutil
23
  import os
24
+ os.mkdir('./data')
25
+ destination_folder = './data/'
26
+ for html_file in files:
27
+ shutil.move(html_file, destination_folder + html_file.split("/")[-1])
28
 
29
 
30
  from langchain.document_loaders import BSHTMLLoader, DirectoryLoader