Spaces:
BHO
/
Runtime error

BHO committed on
Commit
7fbc363
·
0 Parent(s):

Duplicate from BHO/URDtest

Browse files
.gitattributes ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ TC[[:space:]]-[[:space:]]URD[[:space:]]2019[[:space:]]EN[[:space:]]mise[[:space:]]en[[:space:]]ligne.pdf filter=lfs diff=lfs merge=lfs -text
36
+ tik2020-urd-fr-chap6-v2021-03-16-en[[:space:]](1).pdf filter=lfs diff=lfs merge=lfs -text
37
+ tik2020-urd-fr-chap6-v2021-03-16-en.pdf filter=lfs diff=lfs merge=lfs -text
38
+ Tikehau[[:space:]]Capital[[:space:]]-[[:space:]]Investor[[:space:]]Teaser.pdf filter=lfs diff=lfs merge=lfs -text
39
+ Tikehau[[:space:]]Capital[[:space:]]-[[:space:]]Universal[[:space:]]Registration[[:space:]]Document[[:space:]]9[[:space:]]April[[:space:]]2021.pdf filter=lfs diff=lfs merge=lfs -text
40
+ Tikehau[[:space:]]Capital[[:space:]]_RFS[[:space:]]sept[[:space:]]2021_EN.pdf filter=lfs diff=lfs merge=lfs -text
41
+ tikehau-capital-2022-cmd-presentation.pdf filter=lfs diff=lfs merge=lfs -text
42
+ Tikehau-Capital-2022-Universal-Registration-Document-24-March-2023.pdf filter=lfs diff=lfs merge=lfs -text
43
+ tikehau-capital-activity-report-2020-en.pdf filter=lfs diff=lfs merge=lfs -text
44
+ Tikehau-Capital-FY21-results-presentation.pdf filter=lfs diff=lfs merge=lfs -text
45
+ tikehau-capital-fy22-results-presentation-v2.pdf filter=lfs diff=lfs merge=lfs -text
46
+ Tikehau-Capital-H1-2022-results-presentation.pdf filter=lfs diff=lfs merge=lfs -text
47
+ Tikehau-Capital-HY-Financial-Report-30-June-2022-EN.pdf filter=lfs diff=lfs merge=lfs -text
48
+ Tikehau-Capital-Investor-Presentation.pdf filter=lfs diff=lfs merge=lfs -text
49
+ Tikehau-Capital-RA-EN.pdf filter=lfs diff=lfs merge=lfs -text
50
+ Tikehau-Capital-RDD-EN.pdf filter=lfs diff=lfs merge=lfs -text
51
+ tikehau-capital-universal-registration-document-2021-1-april-2022.pdf filter=lfs diff=lfs merge=lfs -text
52
+ tikehau-capital-urd-including-rfs-en-vdef.pdf filter=lfs diff=lfs merge=lfs -text
53
+ TIKEHAU-RA-RT-VA-v15-240x180.pdf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: URDtest
3
+ emoji: 😻
4
+ colorFrom: blue
5
+ colorTo: green
6
+ sdk: gradio
7
+ sdk_version: 3.24.1
8
+ app_file: app.py
9
+ pinned: false
10
+ license: openrail
11
+ duplicated_from: BHO/URDtest
12
+ ---
13
+
14
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
README1.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ Test2
app.py ADDED
@@ -0,0 +1,63 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os
3
+ from langchain.chains import RetrievalQA
4
+ from langchain.llms import OpenAI
5
+ from langchain.document_loaders import PyPDFLoader
6
+ from langchain.document_loaders import DirectoryLoader
7
+ from langchain.text_splitter import CharacterTextSplitter
8
+ from langchain.embeddings import OpenAIEmbeddings
9
+ from langchain.vectorstores import Chroma
10
+
11
+
12
+ # Set the path of your new directory
13
+ dir_path = "./docs"
14
+
15
+ # Create the directory using the os module
16
+ os.makedirs(dir_path, exist_ok=True)
17
+
18
+ # Print a confirmation message
19
+ print(f"New directory created at {dir_path}")
20
+
21
+ def qa_system(pdf_file, openai_key, prompt, chain_type, k):
22
+ os.environ["OPENAI_API_KEY"] = openai_key
23
+
24
+ # load document
25
+ # loader = PyPDFLoader(pdf_file.name)
26
+ loader = DirectoryLoader(dir_path, glob="**/*.pdf") #, loader_cls=PDFLoader)
27
+ documents = loader.load()
28
+
29
+ # split the documents into chunks
30
+ text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
31
+ texts = text_splitter.split_documents(documents)
32
+
33
+ # select which embeddings we want to use
34
+ embeddings = OpenAIEmbeddings()
35
+
36
+ # create the vectorestore to use as the index
37
+ db = Chroma.from_documents(texts, embeddings)
38
+
39
+ # expose this index in a retriever interface
40
+ retriever = db.as_retriever(search_type="similarity", search_kwargs={"k": k})
41
+
42
+ # create a chain to answer questions
43
+ qa = RetrievalQA.from_chain_type(
44
+ llm=OpenAI(), chain_type=chain_type, retriever=retriever, return_source_documents=True)
45
+
46
+ # get the result
47
+ result = qa({"query": prompt})
48
+ return result['result'], [doc.page_content for doc in result["source_documents"]]
49
+
50
+ # define the Gradio interface
51
+ input_file = gr.inputs.File(label="PDF File")
52
+ openai_key = gr.inputs.Textbox(label="OpenAI API Key", type="password")
53
+ prompt = gr.inputs.Textbox(label="Question Prompt")
54
+ chain_type = gr.inputs.Radio(['stuff', 'map_reduce', "refine", "map_rerank"], label="Chain Type")
55
+ k = gr.inputs.Slider(minimum=1, maximum=5, default=1, label="Number of Relevant Chunks")
56
+
57
+ output_text = gr.outputs.Textbox(label="Answer")
58
+ output_docs = gr.outputs.Textbox(label="Relevant Source Text")
59
+
60
+ gr.Interface(qa_system, inputs=[input_file, openai_key, prompt, chain_type, k], outputs=[output_text, output_docs],
61
+ title="Question Answering with PDF File and OpenAI",
62
+ description="Upload a PDF file, enter your OpenAI API key, type a question prompt, select a chain type, and choose the number of relevant chunks to use for the answer.").launch(debug = True)
63
+
docs/TC - URD 2019 EN mise en ligne.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15088bec09fbd6c4658980ab90ad5bb325273eb0267468da6ac6434f3bfee1f3
3
+ size 7532243
docs/TIKEHAU-RA-RT-VA-v15-240x180.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8676af4ccd9079a6faedfd39ba57c8ccfa6d05aaa208cc744966593df1db1118
3
+ size 22690486
docs/Tikehau Capital - Investor Teaser.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667e1da4c7e5dfa69b6c62ce94f01b6a3e5eba567601feff216fa885997a2de6
3
+ size 5064914
docs/Tikehau Capital - Universal Registration Document 9 April 2021.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd8f33e2cdefa8ff6e84a47b6598fec0912c601ccccdfc4ad61f4603a4e586b9
3
+ size 6376414
docs/Tikehau Capital _RFS sept 2021_EN.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10058d01b009a0a74e6547fc461e2da78424783e36fe059e6b61b37fd3593dd6
3
+ size 2448714
docs/Tikehau-Capital-2022-Universal-Registration-Document-24-March-2023.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a19b987f0197078018f45839871518aec37618f6cbc2ab95f52f8c772de5b7
3
+ size 7985418
docs/Tikehau-Capital-FY21-results-presentation.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5930c2bce25a8af42cb8c1b6394f847486ebc554c8ed694c35cd0887a7255ff
3
+ size 2715981
docs/Tikehau-Capital-H1-2022-results-presentation.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:829d65bb2b2058b3cf387b03a8eaaa572c1f23966230c468642b8b58b89470ec
3
+ size 6500940
docs/Tikehau-Capital-HY-Financial-Report-30-June-2022-EN.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2cac86d544737133bae6223132465b7f0192edd80ca0947d03879d84b335660
3
+ size 2354549
docs/Tikehau-Capital-Investor-Presentation.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b925fc588cac372fa27bdc4226a3e841069640dfd2f36820360b218443bf77c3
3
+ size 1926237
docs/Tikehau-Capital-RA-EN.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22a03aa5aaac0c3675a263455f3adb70dce4625e77a6654f05ed538c8b912c4f
3
+ size 37922926
docs/Tikehau-Capital-RDD-EN.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99996fa6fc60dcafece65c5d03692a9814edb36a970d92c3da6a0845ac9f375
3
+ size 6527550
docs/tik2020-urd-fr-chap6-v2021-03-16-en (1).pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e2c19928a0d455bc00feadeb1c5288d2b51caa86fc0c570bbaa6698d973dd24
3
+ size 1733343
docs/tik2020-urd-fr-chap6-v2021-03-16-en.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e2c19928a0d455bc00feadeb1c5288d2b51caa86fc0c570bbaa6698d973dd24
3
+ size 1733343
docs/tikehau-capital-2022-cmd-presentation.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6d2a33aa87a637b3f223b7aea784bee1442cc094c3b36a4b8dc50e5840ebbbf
3
+ size 15985504
docs/tikehau-capital-activity-report-2020-en.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d267be427cfb81bc3cf17232fa4ebb51a11387544e2f59ff16a25f4b80803f39
3
+ size 5820690
docs/tikehau-capital-fy22-results-presentation-v2.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7699efd04b1aa98c074c5189f8c1d4935a91de0c4f8f85b96abd30f2794f5da3
3
+ size 1489144
docs/tikehau-capital-universal-registration-document-2021-1-april-2022.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a057d7eb72b08ddbb1b61dc04a4b98575201b2addc0c8ab3ca9fd105fedb3d42
3
+ size 2927862
docs/tikehau-capital-urd-including-rfs-en-vdef.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25144aafbfcda4febe0cc149572f0128fed61bcd5706f047f11379234d04cb89
3
+ size 2691260
requirements.txt ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ pdfminer.six
2
+ unstructured
3
+ langchain
4
+ openai
5
+ chromadb
6
+ pypdf
7
+ tiktoken
8
+ panel
9
+ gradio