File size: 775 Bytes
c2b1920
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
import os
import pinecone
from langchain.document_loaders import PyPDFLoader
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings import OpenAIEmbeddings
from langchain.vectorstores import Pinecone

# --- Credentials -------------------------------------------------------------
# Every setting comes from the process environment; os.getenv returns None
# for a variable that is not set, and that value is passed on unchanged below.
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
PINECONE_API_KEY = os.getenv("PINECONE_API_KEY")
PINECONE_ENV = os.getenv("PINECONE_ENV")

# --- Pinecone client ---------------------------------------------------------
# Name of the index the documents are written to.
# NOTE(review): nothing here creates the index -- presumably it must already
# exist in the Pinecone project; confirm before running.
index_name = "workflow-helper-index"
pinecone.init(environment=PINECONE_ENV, api_key=PINECONE_API_KEY)

# --- Embedding model ---------------------------------------------------------
# Embeddings object handed to the vector store, built with the OpenAI key.
embedding = OpenAIEmbeddings(openai_api_key=OPENAI_API_KEY)

# --- Source document ---------------------------------------------------------
# "your_doc.pdf" is a relative path, so it is resolved against the current
# working directory of the process.
loader = PyPDFLoader("your_doc.pdf")
# NOTE(review): load_and_split() may return several chunks per PDF page, so
# len(pages) is the number of uploaded documents, not necessarily the page
# count -- confirm against the LangChain loader documentation.
pages = loader.load_and_split()

# --- Upload ------------------------------------------------------------------
# Pass the loaded documents and the embeddings object to the Pinecone vector
# store for the index named above, then report how many were sent.
vectorstore = Pinecone.from_documents(
    documents=pages,
    embedding=embedding,
    index_name=index_name,
)
print(f"Uploaded {len(pages)} pages to Pinecone index '{index_name}'")