Spaces:

subashdvorak
/

Brain-Stroming-Story-Gen-Refining

Build error

App Files Files Community

subashdvorak committed on Jan 8, 2025

Commit

956a6ec

verified ·

1 Parent(s): 29970fa

Upload 5 files

Browse files

Files changed (5) hide show

app.py +20 -0
brain_strom_with_influencer_input.py +281 -0
recommendations_and_engagement_predict.py +127 -0
requirements.txt +10 -0
shared_resources.py +24 -0

app.py ADDED Viewed

	@@ -0,0 +1,20 @@

+import gradio as gr
+from brain_strom_with_influencer_input import ResponseGeneratorApp
+from recommendations_and_engagement_predict import StoryRecommendationApp
+# Build each sub-application first; both are constructed as soon as this module is imported.
+brainstorm_app = ResponseGeneratorApp().build_ui()
+print("Brainstorm App:", type(brainstorm_app))
+recommendation_app = StoryRecommendationApp().launch_interface()
+print("Recommendation App:", type(recommendation_app))
+# Expose both UIs as tabs of one Gradio app; tab names pair up positionally with the interfaces.
+app = gr.TabbedInterface(
+    interface_list=[brainstorm_app, recommendation_app],
+    tab_names=[
+        "Brainstorm with Influencer Input",
+        "Recommendations with Engagement Predictions",
+    ],
+)
+if __name__ == "__main__":
+    # Only start the server when executed as a script, not when imported.
+    app.launch(share=True)

brain_strom_with_influencer_input.py ADDED Viewed

	@@ -0,0 +1,281 @@

+import os
+import gradio as gr
+import torch
+import re
+# from transformers import AutoTokenizer, AutoModelForCausalLM
+from keybert import KeyBERT
+from sentence_transformers import SentenceTransformer
+from datasets import load_dataset,Dataset
+from shared_resources import shared_resources
+from phi.agent import Agent
+from phi.tools.duckduckgo import DuckDuckGo
+from phi.agent import Agent, RunResponse
+from phi.model.huggingface import HuggingFaceChat
+class ResponseGenerator:
+    """Generate video storylines with an LLM agent and derive follow-up brainstorming topics.
+    The sentence encoder and the FAISS-indexed dataset come from the module-level
+    ``shared_resources`` object.
+    """
+    # Hugging Face model id used for every agent call made by this class.
+    MODEL_ID = "meta-llama/Meta-Llama-3-8B-Instruct"
+    # Number of suggestions the brainstorming prompt asks the model for.
+    TOPIC_COUNT = 5
+    def __init__(self):
+        self.ST = shared_resources.sentence_transformer
+        self.data = shared_resources.data
+        self.original_query = ""
+    def _run_agent(self, prompt):
+        """Send ``prompt`` to a freshly built agent and return the reply text ("" when there is none)."""
+        agent = Agent(
+            model=HuggingFaceChat(
+                id=self.MODEL_ID,
+                max_tokens=4096,
+            ),
+            # tools=[DuckDuckGo()],
+            markdown=True
+        )
+        run: RunResponse = agent.run(prompt)
+        return run.content or ""
+    @staticmethod
+    def _split_suggestions(text, limit):
+        """Split ``text`` on '.'/'?' and return the last ``limit`` cleaned, non-empty sentences.
+        Leading list markers ("- ", "* ", "3) ") are removed and fragments without any
+        letter (for example the "1" left over from "1. ...") are dropped.
+        """
+        cleaned = []
+        for fragment in re.split(r'[.?]', text or ""):
+            sentence = re.sub(r'^\s*(?:[-*•]\s+|\d+[.)]\s*)', '', fragment).strip()
+            if any(ch.isalpha() for ch in sentence):
+                cleaned.append(sentence)
+        return cleaned[-limit:]
+    def search(self, query: str, usernames=None, k: int = 3):
+        """Retrieve dataset entries similar to ``query``.
+        Args:
+            query: Free-text query; embedded with the shared sentence transformer.
+            usernames: Optional iterable of usernames. When given, each user's rows are
+                searched separately and only that user's best-matching caption is kept.
+            k: Number of neighbours requested from the index.
+        Returns:
+            With ``usernames``: a list of caption strings, one per username that has rows.
+            Without: the ``(scores, retrieved_examples)`` pair from the full dataset index.
+        """
+        self.embedded_query = self.ST.encode(query)  # Embed the user input
+        self.all_retrievals = []
+        if usernames:
+            dataset = self.data.to_pandas()
+            for username in usernames:
+                filtered_df = dataset[dataset['username'] == username]
+                if filtered_df.empty:
+                    # No rows for this user: there is no nearest caption to read, so skip it.
+                    continue
+                # Throw-away index restricted to this user's rows.
+                user_data = Dataset.from_pandas(filtered_df).add_faiss_index("embeddings")
+                self.scores, self.retrieved_examples = user_data.get_nearest_examples("embeddings", self.embedded_query, k=k)  # Search for top k results
+                captions = self.retrieved_examples['Caption']
+                if captions:
+                    self.all_retrievals.append(str(captions[0]))
+            print('All retrievals are:',self.all_retrievals)
+            return self.all_retrievals
+        self.scores, self.retrieved_examples = self.data.get_nearest_examples("embeddings", self.embedded_query, k=k)  # Search for top k results
+        return self.scores, self.retrieved_examples
+    def generate_response(self, query, username=None, additional_focus=None):
+        """Build the storyline prompt and return the model's reply.
+        Args:
+            query: The user's request; also stored in ``self.original_query``.
+            username: Optional list of usernames; one retrieved caption per user is appended
+                to the prompt as reference material.
+            additional_focus: Optional sentence the storyline should primarily focus on.
+        Returns:
+            The generated storyline text.
+        """
+        self.original_query = query  # Save the original query for future focus
+        # If we are going deeper, add the additional focus to the prompt
+        if additional_focus:
+            prompt = f"""
+        I want to create a detailed storyline for a video primarily focusing on the sentence: **{additional_focus}**, keeping it under 500 words. Please provide the storyline in 6 concise paragraphs that must incorporate the following key features everytime:
+        1. **Story:** How to introduce the scene and set the tone. What is happening in the scence? Describe key visuals and actions.
+        2. **Narration or Voiceover:** Suggestions for narration or voiceover that complements the visuals.
+        3. **Text in the Video:** Propose important text overlays for key moments.
+        4. **Transitions:** Smooth transitions between scenes to maintain flow.
+        5. **Emotional Tone:** The mood and energy of the scenes (e.g., excitement, calm, tension, joy).
+        6. **Key Visuals & Sounds:** Important props, locations, sound effects, or background music to enhance the video.
+        The storyline should flow naturally, without repeating the same information or listing individual features. Ensure the output is engaging and cohesive.
+        Also, suggest **5 relevant hashtags** for the video that reflect its content and themes commonly used on social media for similar videos.
+        """
+        else:
+            prompt = f"""
+        I want to create a detailed storyline for a video in any domain, keeping it under 500 words. Please provide the storyline in 6 concise paragraphs that must incorporate the following key features everytime:
+        1. **Story:** How to introduce the scene and set the tone. What is happening in the scene? Describe key visuals and actions.
+        2. **Narration or Voiceover:** Suggestions for narration or voiceover that complements the visuals.
+        3. **Text in the Video:** Propose important text overlays for key moments.
+        4. **Transitions:** Smooth transitions between scenes to maintain flow.
+        5. **Emotional Tone:** The mood and energy of the scenes (e.g., excitement, calm, tension, joy).
+        6. **Key Visuals & Sounds:** Important props, locations, sound effects, or background music to enhance the video.
+        The storyline should flow naturally, without repeating the same information or listing individual features. Ensure the output is engaging and cohesive.
+        Also, suggest **5 relevant hashtags** for the video that reflect its content and themes commonly used on social media for similar videos.
+        """
+        if username:
+            retrieved_list = self.search(query,username,1)
+            if retrieved_list:
+                # Only mention a reference story when at least one caption was actually found.
+                retrieved_context = "\n".join(retrieved_list)
+                prompt = prompt + f"\n Here is the random video story from the dataset for you. You can use it just for analysing purpose, not for similar generation. This is the story:\n{retrieved_context}"
+        # The closing question is identical with or without reference stories.
+        prompt = prompt + f"\nNow finally i am providing you a question to create a detailed story line for a video. The question is: **{self.original_query}**"
+        return self._run_agent(prompt)
+    def extract_topics(self, story):
+        """Ask the model for brainstorming suggestions about ``story`` and return them as a list.
+        The prompt requests exactly 5 sentences; the last ``TOPIC_COUNT`` cleaned sentences of
+        the reply are returned (fewer if the reply contains fewer).
+        """
+        prompt = f'''I want to brainstorm ways to diversify or improve a storyline in exactly 5 sentences. No more than 5 nor less than 5.
+The goal is to generate creative and actionable ideas that are not on the storyline on how the storyline can be expanded or modified for better engagement.
+For example: If the storyline is about creating a promotional video for a restaurant, the new suggestions might include:
+- I want to showcase the chef preparing a signature dish.
+- I want to add a sequence of customers sharing their experiences at the restaurant.
+- I want to highlight the farm-to-table sourcing of ingredients with a short segment showing local farms.
+- I want to include a time-lapse of the restaurant transforming from day to night, capturing its unique ambiance.
+- I want to feature a quick interview with the owner sharing the story behind the restaurant.
+Now, I will provide you with the storyline. The storyline is:\n{story}
+Please remember, don't give any introduction or explanations. Just generate 5 sentences directly, focusing on creative suggestions for diversifying or modifying the storyline.  '''
+        generated_text = self._run_agent(prompt)
+        # Keep the tail of the reply: any preamble the model adds comes before the suggestions.
+        sentences = self._split_suggestions(generated_text, self.TOPIC_COUNT)
+        print('The sentences are:',sentences)
+        return sentences
+    def on_select_topic(self, selected_topic, history_stack, current_state):
+        """Generate a new storyline focused on ``selected_topic`` and push the old state to history.
+        Returns:
+            ``(new_state, history_stack, response_update, topics_update)``. When no topic is
+            selected, the inputs are returned unchanged with no-op updates.
+        """
+        if not selected_topic:
+            # Nothing is selected (e.g. the radio value was cleared): do not call the model.
+            return current_state, history_stack, gr.update(), gr.update()
+        # Save current state in history
+        history_stack.append(current_state)
+        # Prefer the query carried in the state; fall back to the last query seen by this object.
+        query = (current_state or {}).get("query") or self.original_query
+        new_response = self.generate_response(query, additional_focus=selected_topic)
+        new_topics = self.extract_topics(new_response)
+        # Prepare new state
+        new_state = {
+            "query": query,
+            "response": new_response,
+            "topics": new_topics,
+            "key_topics": new_topics
+        }
+        return new_state, history_stack, gr.update(value=new_response), gr.update(choices=new_topics)
+    def on_back(self, history_stack):
+        """Pop the most recent saved state and return updates that restore its response and topics.
+        With an empty history the response box and topic list are cleared instead.
+        """
+        if history_stack:
+            # Pop the last state from history
+            previous_state = history_stack.pop() or {}
+            # .get keeps an empty saved state from raising KeyError.
+            return history_stack, gr.update(value=previous_state.get("response", "")), \
+                gr.update(choices=previous_state.get("key_topics", []))
+        # If no history, clear outputs
+        return history_stack, gr.update(value=""), gr.update(choices=[])
+class ResponseGeneratorApp:
+    """Gradio front end that wires a ResponseGenerator into an interactive brainstorming UI."""
+    def __init__(self):
+        self.point_generator = ResponseGenerator()
+    def build_ui(self):
+        """Assemble the Blocks layout, register the event handlers, and return the Blocks object."""
+        with gr.Blocks() as demo:
+            # The heading needs a space after '#' to be rendered as a Markdown heading.
+            gr.Markdown(
+                """
+                # Brainstorming App
+                Enter a query to generate a detailed response and start brainstroming for further exploration.
+                """
+            )
+            query_input = gr.Textbox(
+                label="Enter your query",
+                placeholder="Type a query, e.g., 'I want to create a promotional video of Begnas Lake.'",
+                lines=2,
+            )
+            usernames = [
+                "_travelwithsapana", "givina_9", "rajen.rb", "wh0z.khu5h1", "palam061",
+                "prettiest_sky", "explorepokhara", "ggkaam610", "anjana_dhl1",
+            ]
+            username_inputs = gr.CheckboxGroup(choices=usernames,label="Choose one or more username of whose you want similar story::",type="value")
+            generate_btn = gr.Button(value="Generate")
+            # Output box for the generated text
+            response_output = gr.Textbox(
+                label="Generated Response",
+                lines=10,
+                interactive=False
+            )
+            # Dynamic radio buttons area for the extracted topics
+            topics_radio = gr.Radio(
+                label="Brain Stroming Areas....",
+                choices=[],
+                type="value",
+                interactive=True
+            )
+            back_btn = gr.Button(value="Back")
+            # Per-session state: the current response/topics and the stack of earlier states.
+            current_state = gr.State({})
+            history_stack = gr.State([])
+            # Generate: produce a storyline plus topics for the typed query.
+            generate_btn.click(
+                fn=self.generate_handler,
+                inputs=[query_input,username_inputs],
+                outputs=[current_state, response_output, topics_radio],
+            )
+            # Selecting a topic generates the next stage focused on that topic.
+            topics_radio.change(
+                fn=self.point_generator.on_select_topic,
+                inputs=[topics_radio, history_stack, current_state],
+                outputs=[current_state, history_stack, response_output, topics_radio]
+            )
+            # Back restores the previously shown response and topics.
+            back_btn.click(
+                fn=self.point_generator.on_back,
+                inputs=[history_stack],
+                outputs=[history_stack, response_output, topics_radio]
+            )
+        return demo
+    def generate_handler(self, query,usernames):
+        """Generate a storyline and its brainstorming topics for ``query``.
+        Args:
+            query: Text typed by the user.
+            usernames: Usernames ticked in the checkbox group (may be empty).
+        Returns:
+            ``(state_dict, response_update, topics_update)`` matching the click outputs.
+            A blank query returns an empty state and cleared outputs without calling the model.
+        """
+        if not query or not query.strip():
+            return {}, gr.update(value=""), gr.update(choices=[])
+        response = self.point_generator.generate_response(query,usernames)
+        topics = self.point_generator.extract_topics(response)
+        # Prepare the current state; the query is stored alongside the generated output.
+        current_state = {
+            "query": query,
+            "response": response,
+            "topics": topics,
+            "key_topics": topics
+        }
+        return current_state, gr.update(value=response), gr.update(choices=topics)

recommendations_and_engagement_predict.py ADDED Viewed

	@@ -0,0 +1,127 @@

+import os
+import gradio as gr
+# from transformers import AutoTokenizer, AutoModelForCausalLM
+from sentence_transformers import SentenceTransformer
+from datasets import load_dataset
+import numpy as np
+import torch
+from shared_resources import shared_resources
+from phi.agent import Agent
+from phi.tools.duckduckgo import DuckDuckGo
+from phi.agent import Agent, RunResponse
+from phi.model.huggingface import HuggingFaceChat
+class StoryRecommendationApp:
+    """Recommend similar videos, estimate engagement, and draft a video-generation prompt for a story."""
+    def __init__(self):
+        # self.tokenizer = shared_resources.tokenizer
+        # self.model = shared_resources.model
+        self.device = shared_resources.device
+        self.sentence_transformer = shared_resources.sentence_transformer
+        self.data = shared_resources.data
+    @staticmethod
+    def _as_int(value):
+        """Convert ``value`` to int, mapping None, NaN, infinities and non-numeric input to 0."""
+        try:
+            number = float(value)
+        except (TypeError, ValueError):
+            return 0
+        return int(number) if np.isfinite(number) else 0
+    def search(self, query: str, k: int = 3):
+        """Return ``(scores, retrieved_examples)`` for the ``k`` dataset rows nearest to ``query``."""
+        embedded_query = self.sentence_transformer.encode(query)
+        scores, retrieved_examples = self.data.get_nearest_examples("embeddings", embedded_query, k=k)
+        # NOTE(review): the clean-up below only acts on ndarray/list results; presumably
+        # get_nearest_examples returns a dict of columns, in which case neither branch runs - confirm.
+        if isinstance(retrieved_examples, np.ndarray):
+            retrieved_examples = np.nan_to_num(retrieved_examples, nan=0)
+        elif isinstance(retrieved_examples, list):
+            retrieved_examples = [
+                [0 if np.isnan(val) else val for val in example] if isinstance(example, list) else example
+                for example in retrieved_examples
+            ]
+        return scores, retrieved_examples
+    def compute_mean_and_predict(self, retrieved_examples):
+        """Average LikesCount, commentCount and shareCount over the retrieved rows.
+        Missing (None/NaN) entries count as 0. An empty column yields 0 rather than an error.
+        Returns:
+            Dict mapping ``predicted_<feature>`` to the integer-truncated mean.
+        """
+        features = ["LikesCount", "commentCount", "shareCount"]
+        predictions = {}
+        for feature in features:
+            raw_values = [np.nan if v is None else v for v in retrieved_examples[feature]]
+            values = np.nan_to_num(np.array(raw_values, dtype=float), nan=0.0)
+            # np.mean of an empty array is NaN, which int() cannot convert.
+            mean_value = int(np.mean(values)) if values.size else 0
+            predictions[f"predicted_{feature}"] = mean_value
+        return predictions
+    def generate_prompt(self, query: str):
+        """Ask the model to condense ``query`` into 3 sentences and return the last 3 sentences of its reply."""
+        input_text = f'''
+        I want to summarize a story in exactly 3 sentences. No more than 3 nor less than 3.
+        But the sentences have to be good enough to use as a prompt for video generation, because I have to give those 3 sentences to the video generation model.
+        For example: This prompt is about A heartwarming family reunion celebrating love and cherished memories in exactly 3 sentences.
+        -A warm, heartfelt reunion in a cozy living room, where family members embrace each other after a long time apart, soft lighting enhances the intimate atmosphere, and laughter fills the air.
+        -A close-up shot of a grandmother’s hands carefully arranging a family photo album, as the camera pans over old pictures, evoking cherished memories and a deep sense of love.
+        -A final moment around the dinner table, family members sharing a meal together, toasts are made, and the soft glow of candles reflects the joy and connection between generations.
+        So, I will provide you that story now. The story is:\n{query}
+        Please remember, don't give any background descriptions. Just generate 3 sentences likewise the example above. Don't even give the starting text like: "Here are the 3 sentences that summarize the story:" or any other like this. Just give the answers in 3 sentences directly
+        '''
+        agent = Agent(
+            model=HuggingFaceChat(
+                id="meta-llama/Meta-Llama-3-8B-Instruct",
+                max_tokens=4096,
+            ),
+            # tools=[DuckDuckGo()],
+            markdown=True
+        )
+        # Get the response in a variable
+        run: RunResponse = agent.run(input_text)
+        generated_text = run.content or ""
+        # Filter on the stripped text so whitespace-only fragments (e.g. after the final
+        # period) do not take one of the three slots.
+        sentences = [part.strip() for part in generated_text.split('.') if part.strip()]
+        return '. '.join(sentences[-3:]) + ('.' if sentences else '')
+    def generate_story_and_recommendation(self, generated_response: str):
+        """Build recommendations, engagement predictions and a video prompt for a story.
+        Returns:
+            ``(recommendation_text, predictions_dict, video_prompt)``. When the search yields
+            nothing, a placeholder text, an empty dict and an empty prompt are returned.
+        """
+        scores, result = self.search(generated_response, 4)
+        if scores is None or result is None:
+            # Nothing retrieved: return placeholders instead of reading unassigned names.
+            return "No recommendations available.", {}, ""
+        recommendations = [
+            f"Video {idx}: {url}\nPlaycount: {self._as_int(play_count)}\n"
+            for idx, (url, play_count) in enumerate(zip(result['url'], result['playCount']), start=1)
+        ]
+        recommended_text = "\n\n".join(recommendations)
+        recommended_influencer = f"\nYou can use these influencers for this type of video {str(result['username'][:3])}"
+        predictions = self.compute_mean_and_predict(result)
+        generated_prompt = self.generate_prompt(generated_response)
+        return recommended_text + recommended_influencer, predictions, generated_prompt
+    def format_predictions(self, predictions):
+        """Render the predictions dict as one ``key: value`` line per entry."""
+        if predictions:
+            return "\n".join([f"{key}: {value}" for key, value in predictions.items()])
+        else:
+            return "No predictions available."
+    def _respond(self, generated_response: str):
+        """Gradio callback: run generate_story_and_recommendation and show the predictions as text."""
+        recommendations, predictions, video_prompt = self.generate_story_and_recommendation(generated_response)
+        return recommendations, self.format_predictions(predictions), video_prompt
+    def launch_interface(self):
+        """Build and return the Gradio Interface (the caller decides when to launch it)."""
+        interface=gr.Interface(
+            fn=self._respond,
+            inputs=gr.Textbox(label="Enter your generated story.", lines=15),
+            outputs=[
+                gr.Textbox(label="Our Recommendations for you."),
+                gr.Textbox(label="Predicted Metrics (Likes, Comments, Shares)", type="text"),
+                gr.Textbox(label="Recommended Prompt for video generation:"),
+            ],
+            title="Video Story Generation and Recommendation",
+            description="Enter a request for a video storyline, and get a detailed story along with recommended videos and predicted engagement metrics based on the same input."
+        )
+        return interface

requirements.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+gradio
+transformers
+sentence-transformers
+datasets
+faiss-cpu
+pydub
+torch
+scipy
+phidata
+duckduckgo-search
+# Imported at module level by brain_strom_with_influencer_input.py
+keybert

shared_resources.py ADDED Viewed

	@@ -0,0 +1,24 @@

+# shared_resources.py
+import torch
+# from transformers import AutoTokenizer, AutoModelForCausalLM
+from sentence_transformers import SentenceTransformer
+from datasets import load_dataset
+# from transformers import AutoProcessor, MusicgenForConditionalGeneration
+import re
+class SharedResources:
+    """Holds the heavyweight objects (device, encoder, indexed dataset) that the app modules share."""
+    def __init__(self):
+        # Prefer the GPU when torch can see one; otherwise stay on the CPU.
+        has_cuda = torch.cuda.is_available()
+        self.device = torch.device("cuda" if has_cuda else "cpu")
+        # Sentence-embedding model used to encode queries.
+        self.sentence_transformer = SentenceTransformer("mixedbread-ai/mxbai-embed-large-v1")
+        # Fetch the "embedded" revision of the dataset and keep its train split,
+        # with a FAISS index built over the "embeddings" column.
+        self.dataset = load_dataset("subashdvorak/tiktok-story-data1", revision="embedded")
+        self.data = self.dataset["train"].add_faiss_index("embeddings")
+# Module-level singleton: built once when this module is first imported, so every module
+# that imports `shared_resources` reuses the same loaded model and indexed dataset.
+shared_resources = SharedResources()