Spaces:

oliverwang15
/

DAN_AI

Sleeping

App Files Community

oliverwang15 committed on Dec 5, 2023

Commit

d29770b

1 Parent(s): 8650c17

updates on the experiment

Browse files

Files changed (5) hide show

app.py +5 -3
backend.py +39 -20
offline_results/exp_ga.csv +0 -0
offline_results/exp_gb.csv +0 -0
offline_results/exp_test.csv +0 -0

app.py CHANGED Viewed

@@ -35,7 +35,9 @@ with gr.Blocks(theme="dark") as demo:
                     openai_key = gr.Textbox(
                         label='Enter your OpenAI API key here',
                         type='password')
                     file = gr.File(label='Upload your .txt or .pdf file here', file_types=['.txt', '.pdf'], file_count = 'multiple')
                     btn_submit_txt_online = gr.Button(value='Submit')
                     # btn_submit_txt.style(full_width=True)
@@ -43,7 +45,7 @@ with gr.Blocks(theme="dark") as demo:
                 with gr.Group():
                     gr.Markdown(f'<center><h2>Or Load Offline</h2></center>')
                     questions = gr.CheckboxGroup(choices = QUESTIONS, value = QUESTIONS, label="Questions (Please don't change this part now)", info="Please select the question you want to ask")
-                    answer_type = gr.Radio(choices = ["ChatGPT_txt", "GPT4_txt", 'New_GPT_4_pdf'], label="Answer_type", info="Please select the type of answer you want to show")
                     btn_submit_txt_offline = gr.Button(value='Show Answers')
                     # btn_submit_txt.style(full_width=True)
@@ -119,7 +121,7 @@ with gr.Blocks(theme="dark") as demo:
     # Submit button
     btn_submit_txt_online.click(
             backend.process_file_online,
-            inputs=[file, questions, openai_key],
             outputs=[filename_box, question_box, answer_box, reference_box, highlighted_text, correct_answer, correct_reference],
     )

                     openai_key = gr.Textbox(
                         label='Enter your OpenAI API key here',
                         type='password')
+                    model_selection = gr.Radio(choices = ["ChatGPT", "GPT4"], label="Model Selection", info="Please select the model you want to use")
                     file = gr.File(label='Upload your .txt or .pdf file here', file_types=['.txt', '.pdf'], file_count = 'multiple')
                     btn_submit_txt_online = gr.Button(value='Submit')
                     # btn_submit_txt.style(full_width=True)
                 with gr.Group():
                     gr.Markdown(f'<center><h2>Or Load Offline</h2></center>')
                     questions = gr.CheckboxGroup(choices = QUESTIONS, value = QUESTIONS, label="Questions (Please don't change this part now)", info="Please select the question you want to ask")
+                    answer_type = gr.Radio(choices = ["ChatGPT_txt", "GPT4_txt", 'New_GPT_4_pdf', 'Exp_text', 'Exp_Group_A', 'Exp_Group_B'], label="Answer_type", info="Please select the type of answer you want to show")
                     btn_submit_txt_offline = gr.Button(value='Show Answers')
                     # btn_submit_txt.style(full_width=True)
     # Submit button
     btn_submit_txt_online.click(
             backend.process_file_online,
+            inputs=[file, questions, openai_key, model_selection],
             outputs=[filename_box, question_box, answer_box, reference_box, highlighted_text, correct_answer, correct_reference],
     )

backend.py CHANGED Viewed

@@ -73,7 +73,7 @@ class Backend:
         return text
-    def process_file_online(self, file, questions, openai_key, progress = gr.Progress()):
         # record the questions
         self.questions = questions
@@ -83,10 +83,16 @@ class Backend:
         # make the prompt
         prompt_list = [self.prompt.get(text, questions, 'v3') for text in self.text_list]
         # interact with openai
         self.res_list = []
         for prompt in progress.tqdm(prompt_list, desc = 'Generating answers...'):
-            res = self.agent(prompt, with_history = False, temperature = 0.1, model = 'gpt-3.5-turbo-16k', api_key = openai_key)
             res = self.prompt.process_result(res, 'v3')
             self.res_list.append(res)
@@ -362,29 +368,42 @@ class Backend:
             df = pd.read_csv('./offline_results/results_all_gpt4.csv')
         elif answer_type == 'New_GPT_4_pdf':
             df = pd.read_csv('./offline_results/results_new_pdf.csv')
         # make the prompt
         self.res_list = self.phase_df(df)
-        if answer_type == 'ChatGPT_txt' or answer_type == 'GPT4_txt':
-            txt_root_path = './20230808-AI coding-1st round'
-            self.filename_list = df['fn'].tolist()
-        elif answer_type == 'New_GPT_4_pdf':
-            txt_root_path = './new_pdfs'
             self.filename_list = df['fn'].tolist()
-            self.filename_list = ['.'.join(f.split('.')[:-1]) + '.txt' for f in self.filename_list]
-        self.text_list = []
-        for file in progress.tqdm(self.filename_list):
-            if file.split('.')[-1] == 'pdf':
-                # convert pdf to txt
-                text = self.phrase_pdf(os.path.join(txt_root_path, file))
-            else:
-                text_path = os.path.join(txt_root_path, file)
-                with open(text_path, 'r', encoding='utf-8') as f:
-                    text = f.read()
-            self.text_list.append(text)
         # Use the first file as default
         # Use the first question for multiple questions

         return text
+    def process_file_online(self, file, questions, openai_key, model_selection, progress = gr.Progress()):
         # record the questions
         self.questions = questions
         # make the prompt
         prompt_list = [self.prompt.get(text, questions, 'v3') for text in self.text_list]
+        # select the model
+        if model_selection == 'ChatGPT':
+            model = 'gpt-3.5-turbo-16k'
+        elif model_selection == 'GPT4':
+            model = 'gpt-4-1106-preview'
         # interact with openai
         self.res_list = []
         for prompt in progress.tqdm(prompt_list, desc = 'Generating answers...'):
+            res = self.agent(prompt, with_history = False, temperature = 0.1, model = model, api_key = openai_key)
             res = self.prompt.process_result(res, 'v3')
             self.res_list.append(res)
             df = pd.read_csv('./offline_results/results_all_gpt4.csv')
         elif answer_type == 'New_GPT_4_pdf':
             df = pd.read_csv('./offline_results/results_new_pdf.csv')
+        elif answer_type == 'Exp_text':
+            df = pd.read_csv('./offline_results/exp_test.csv')
+        elif answer_type == 'Exp_Group_A':
+            df = pd.read_csv('./offline_results/exp_ga.csv')
+        elif answer_type == 'Exp_Group_B':
+            df = pd.read_csv('./offline_results/exp_gb.csv')
         # make the prompt
         self.res_list = self.phase_df(df)
+        if answer_type in ['ChatGPT_txt', 'GPT4_txt', 'New_GPT_4_pdf']:
+            if answer_type == 'ChatGPT_txt' or answer_type == 'GPT4_txt':
+                txt_root_path = './20230808-AI coding-1st round'
+                self.filename_list = df['fn'].tolist()
+            elif answer_type == 'New_GPT_4_pdf':
+                txt_root_path = './new_pdfs'
+                self.filename_list = df['fn'].tolist()
+                self.filename_list = ['.'.join(f.split('.')[:-1]) + '.txt' for f in self.filename_list]
+            self.text_list = []
+            for file in progress.tqdm(self.filename_list):
+                if file.split('.')[-1] == 'pdf':
+                    # convert pdf to txt
+                    text = self.phrase_pdf(os.path.join(txt_root_path, file))
+                else:
+                    text_path = os.path.join(txt_root_path, file)
+                    with open(text_path, 'r', encoding='utf-8') as f:
+                        text = f.read()
+                self.text_list.append(text)
+        elif answer_type in ['Exp_text', 'Exp_Group_A', 'Exp_Group_B']:
             self.filename_list = df['fn'].tolist()
+            self.text_list = df['content'].tolist()
         # Use the first file as default
         # Use the first question for multiple questions

offline_results/exp_ga.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

offline_results/exp_gb.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

offline_results/exp_test.csv ADDED Viewed

The diff for this file is too large to render. See raw diff