Spaces:

rawpowertools
/

Template_Generator

Running

App Files Files

DJHumanRPT committed on Mar 6, 2025

Commit

136fb03

verified ·

1 Parent(s): e25ab06

Update app.py

Browse files

Files changed (1) hide show

app.py +222 -21

app.py CHANGED Viewed

@@ -125,9 +125,7 @@ def call_llm(prompt, model="gpt-3.5-turbo"):
         if st.session_state.show_template_editor and st.session_state.template_spec:
             output_vars = st.session_state.template_spec.get("output", [])
             if output_vars:
-                output_specs = (
-                    "Please generate output with the following specifications:\n"
-                )
                 for var in output_vars:
                     output_specs += (
                         f"- {var['name']}: {var['description']} (Type: {var['type']})"
@@ -137,15 +135,49 @@ def call_llm(prompt, model="gpt-3.5-turbo"):
                     output_specs += "\n"
                 # Add the output specs to the prompt
-                prompt = f"{prompt}\n\n{output_specs}"
         response = client.chat.completions.create(
             model=model,
             messages=[{"role": "user", "content": prompt}],
             max_tokens=1000,
-            temperature=0.7,
         )
-        return response.choices[0].message.content
     except Exception as e:
         st.error(f"Error calling LLM API: {str(e)}")
         return f"Error: {str(e)}"
@@ -200,6 +232,8 @@ Generate a JSON template specification with the following structure:
 }}
 Make sure the prompt includes all input variables and is designed to produce the expected outputs.
 If a 'lore' or 'knowledge_base' should be incorporated, include {{lore}} in the prompt template.
 If document content was provided, design the template to effectively use that information.
 """
@@ -1463,15 +1497,31 @@ with tab3:
         if st.session_state.generated_output:
             st.header("Generated Output")
             st.markdown("### Result")
-            st.write(st.session_state.generated_output)
-            # Option to save the output
-            st.download_button(
-                label="Download Output",
-                data=st.session_state.generated_output,
-                file_name="generated_output.txt",
-                mime="text/plain",
-            )
     else:
         st.info(
             "No template has been generated yet. Go to the 'Setup' tab to create one."
@@ -1511,6 +1561,10 @@ with tab4:
             st.session_state.combined_data = []
         if "show_json_columns" not in st.session_state:
             st.session_state.show_json_columns = False
         # Generate inputs button
         if st.button("Generate Synthetic Inputs"):
@@ -1528,6 +1582,12 @@ with tab4:
                     st.success(
                         f"Generated {len(st.session_state.synthetic_inputs)} input samples"
                     )
         # Display generated inputs if available
         if st.session_state.synthetic_inputs:
@@ -1546,21 +1606,162 @@ with tab4:
                 mime="text/csv",
             )
             # Generate outputs button
-            if st.button("Generate Outputs for These Inputs"):
                 if not st.session_state.get("api_key"):
                     st.error("Please provide an OpenAI API key in the sidebar.")
                 else:
-                    with st.spinner("Generating outputs for each input..."):
-                        st.session_state.combined_data = generate_synthetic_outputs(
-                            st.session_state.template_spec,
-                            st.session_state.synthetic_inputs,
                             st.session_state.knowledge_base,
                         )
-                    if st.session_state.combined_data:
                         st.success(
-                            f"Generated outputs for {len(st.session_state.combined_data)} inputs"
                         )
         # Display combined data if available

         if st.session_state.show_template_editor and st.session_state.template_spec:
             output_vars = st.session_state.template_spec.get("output", [])
             if output_vars:
+                output_specs = "Please generate output with the following specifications in JSON format:\n"
                 for var in output_vars:
                     output_specs += (
                         f"- {var['name']}: {var['description']} (Type: {var['type']})"
                     output_specs += "\n"
                 # Add the output specs to the prompt
+                prompt = f"{prompt}\n\n{output_specs}\n\nReturn ONLY a JSON object with the output variables, with no additional text or explanation."
         response = client.chat.completions.create(
             model=model,
             messages=[{"role": "user", "content": prompt}],
             max_tokens=1000,
+            temperature=st.session_state.get("temperature", 0.7),
         )
+        result = response.choices[0].message.content
+        # Try to parse as JSON if the template has output variables
+        if (
+            st.session_state.show_template_editor
+            and st.session_state.template_spec
+            and st.session_state.template_spec.get("output")
+        ):
+            # Extract JSON from the response
+            json_pattern = r"```json\s*([\s\S]*?)\s*```|^\s*\{[\s\S]*\}\s*$"
+            json_match = re.search(json_pattern, result)
+            if json_match:
+                json_str = json_match.group(1) if json_match.group(1) else result
+                # Clean up any remaining markdown or comments
+                json_str = re.sub(r"```.*|```", "", json_str).strip()
+                try:
+                    output_data = json.loads(json_str)
+                    # Store the parsed JSON in session state for proper rendering
+                    st.session_state.json_output = output_data
+                    return output_data
+                except:
+                    pass
+            else:
+                try:
+                    output_data = json.loads(result)
+                    # Store the parsed JSON in session state for proper rendering
+                    st.session_state.json_output = output_data
+                    return output_data
+                except:
+                    pass
+        # If we couldn't parse as JSON or it's not meant to be JSON, return as is
+        return result
     except Exception as e:
         st.error(f"Error calling LLM API: {str(e)}")
         return f"Error: {str(e)}"
 }}
 Make sure the prompt includes all input variables and is designed to produce the expected outputs.
+The prompt should address an LLM as if it was a combination of a system prompt and user input, and must contain information around formatting,
+structure and context for the LLM to generate the desired content as derived from these instructions and/or documents.
 If a 'lore' or 'knowledge_base' should be incorporated, include {{lore}} in the prompt template.
 If document content was provided, design the template to effectively use that information.
 """
         if st.session_state.generated_output:
             st.header("Generated Output")
             st.markdown("### Result")
+            # Check if the output is a dictionary (JSON)
+            if isinstance(st.session_state.generated_output, dict):
+                # Display as JSON
+                st.json(st.session_state.generated_output)
+                # Option to save the output as JSON
+                output_json = json.dumps(st.session_state.generated_output, indent=2)
+                st.download_button(
+                    label="Download Output (JSON)",
+                    data=output_json,
+                    file_name="generated_output.json",
+                    mime="application/json",
+                )
+            else:
+                # Display as text
+                st.write(st.session_state.generated_output)
+                # Option to save the output as text
+                st.download_button(
+                    label="Download Output",
+                    data=str(st.session_state.generated_output),
+                    file_name="generated_output.txt",
+                    mime="text/plain",
+                )
     else:
         st.info(
             "No template has been generated yet. Go to the 'Setup' tab to create one."
             st.session_state.combined_data = []
         if "show_json_columns" not in st.session_state:
             st.session_state.show_json_columns = False
+        if "modified_prompt_template" not in st.session_state:
+            st.session_state.modified_prompt_template = ""
+        if "selected_samples" not in st.session_state:
+            st.session_state.selected_samples = []
         # Generate inputs button
         if st.button("Generate Synthetic Inputs"):
                     st.success(
                         f"Generated {len(st.session_state.synthetic_inputs)} input samples"
                     )
+                    # Reset selected samples when new inputs are generated
+                    st.session_state.selected_samples = []
+                    # Reset modified prompt when new inputs are generated
+                    st.session_state.modified_prompt_template = (
+                        st.session_state.template_spec["prompt"]
+                    )
         # Display generated inputs if available
         if st.session_state.synthetic_inputs:
                 mime="text/csv",
             )
+            # Sample selection for output generation
+            st.subheader("Generate Outputs")
+            # Initialize the modified prompt template if not already done
+            if not st.session_state.modified_prompt_template:
+                st.session_state.modified_prompt_template = (
+                    st.session_state.template_spec["prompt"]
+                )
+            # Allow editing the prompt template
+            with st.expander("View/Edit Prompt Template", expanded=False):
+                st.info(
+                    "You can modify the prompt template used for generating outputs. Use {variable_name} to refer to input variables."
+                )
+                st.session_state.modified_prompt_template = st.text_area(
+                    "Prompt Template",
+                    value=st.session_state.modified_prompt_template,
+                    height=200,
+                )
+                # Button to reset to original template
+                if st.button("Reset to Original Template"):
+                    st.session_state.modified_prompt_template = (
+                        st.session_state.template_spec["prompt"]
+                    )
+                    st.success("Prompt template reset to original")
+            # Sample selection options
+            selection_method = st.radio(
+                "Select samples for output generation",
+                options=["Generate for all samples", "Select specific samples"],
+                index=0,
+            )
+            if selection_method == "Select specific samples":
+                # Create a list of sample indices for selection
+                sample_options = [
+                    f"Sample {i+1}"
+                    for i in range(len(st.session_state.synthetic_inputs))
+                ]
+                # Allow multi-selection of samples
+                selected_indices = st.multiselect(
+                    "Select samples to generate outputs for",
+                    options=range(len(sample_options)),
+                    format_func=lambda i: sample_options[i],
+                )
+                # Store selected samples
+                st.session_state.selected_samples = selected_indices
+                # Preview selected samples
+                if selected_indices:
+                    st.write(f"Selected {len(selected_indices)} samples:")
+                    selected_df = pd.DataFrame(
+                        [st.session_state.synthetic_inputs[i] for i in selected_indices]
+                    )
+                    st.dataframe(selected_df)
+            else:
+                # Use all samples
+                st.session_state.selected_samples = list(
+                    range(len(st.session_state.synthetic_inputs))
+                )
+            # Preview the prompt for a selected sample
+            if st.session_state.selected_samples:
+                with st.expander("Preview Prompt for Sample", expanded=False):
+                    # Let user select which sample to preview
+                    preview_index = st.selectbox(
+                        "Select a sample to preview prompt",
+                        options=st.session_state.selected_samples,
+                        format_func=lambda i: f"Sample {i+1}",
+                    )
+                    # Get the selected sample
+                    sample = st.session_state.synthetic_inputs[preview_index]
+                    # Fill the prompt template with sample values
+                    filled_prompt = st.session_state.modified_prompt_template
+                    for var_name, var_value in sample.items():
+                        filled_prompt = filled_prompt.replace(
+                            f"{{{var_name}}}", str(var_value)
+                        )
+                    # Replace {lore} with knowledge base if present
+                    if "{lore}" in filled_prompt:
+                        filled_prompt = filled_prompt.replace(
+                            "{lore}", st.session_state.knowledge_base
+                        )
+                    # Show the filled prompt
+                    st.text_area(
+                        "Filled Prompt", value=filled_prompt, height=300, disabled=True
+                    )
             # Generate outputs button
+            if st.button("Generate Outputs for Selected Samples"):
                 if not st.session_state.get("api_key"):
                     st.error("Please provide an OpenAI API key in the sidebar.")
+                elif not st.session_state.selected_samples:
+                    st.error("No samples selected for output generation.")
                 else:
+                    # Create a copy of the template spec with the modified prompt
+                    modified_template = st.session_state.template_spec.copy()
+                    modified_template["prompt"] = (
+                        st.session_state.modified_prompt_template
+                    )
+                    # Get only the selected samples
+                    selected_inputs = [
+                        st.session_state.synthetic_inputs[i]
+                        for i in st.session_state.selected_samples
+                    ]
+                    with st.spinner(
+                        f"Generating outputs for {len(selected_inputs)} samples..."
+                    ):
+                        generated_outputs = generate_synthetic_outputs(
+                            modified_template,
+                            selected_inputs,
                             st.session_state.knowledge_base,
                         )
+                    if generated_outputs:
+                        # If we're generating for all samples, replace the combined data
+                        if selection_method == "Generate for all samples":
+                            st.session_state.combined_data = generated_outputs
+                        else:
+                            # If we're generating for specific samples, update only those samples
+                            # First, ensure combined_data exists and has the right size
+                            if not st.session_state.combined_data or len(
+                                st.session_state.combined_data
+                            ) != len(st.session_state.synthetic_inputs):
+                                st.session_state.combined_data = [None] * len(
+                                    st.session_state.synthetic_inputs
+                                )
+                            # Update only the selected samples
+                            for i, output_idx in enumerate(
+                                st.session_state.selected_samples
+                            ):
+                                if i < len(generated_outputs):
+                                    st.session_state.combined_data[output_idx] = (
+                                        generated_outputs[i]
+                                    )
+                            # Remove any None values (samples that haven't been generated yet)
+                            st.session_state.combined_data = [
+                                item
+                                for item in st.session_state.combined_data
+                                if item is not None
+                            ]
                         st.success(
+                            f"Generated outputs for {len(generated_outputs)} samples"
                         )
         # Display combined data if available