Spaces:

Manaranjan
/

llmtimeline

Runtime error

App Files Files Community

Manaranjan committed on Aug 21, 2024

Commit

05caf50

verified ·

1 Parent(s): ab67d2e

deploy at 2024-08-21 10:24:01.130174

Browse files

Files changed (3) hide show

config.ini +5 -0
main.py +48 -11
timeline.csv +15 -20

config.ini ADDED Viewed

	@@ -0,0 +1,5 @@

+[DEFAULT]
+dataset_id = space-backup
+db_dir = data
+private_backup = True

main.py CHANGED Viewed

@@ -4,6 +4,7 @@ import os
 import json
 import pandas as pd
 import traceback
 from datetime import datetime
 from typing import Literal
 from pydantic_core import from_json
@@ -16,6 +17,7 @@ from langchain_openai import ChatOpenAI
 from langchain_anthropic import ChatAnthropic
 from pydantic import BaseModel, Field, ValidationError
 from langchain_openai import ChatOpenAI
 from fasthtml.common import *
 from fasthtml.components import Svg
 from langchain_community.utilities.wikipedia import WikipediaAPIWrapper
@@ -36,7 +38,7 @@ class Event(BaseModel):
     sentiment: Literal["Positive", "Negative"] = Field(..., description="Categorization of the event sentiment")
 class EventResponse(BaseModel):
-    events: List[Event] = Field(min_length=10, max_length=30, description="List of events extracted from the context")
 # Set up the Pydantic output parser
 parser = PydanticOutputParser(pydantic_object=EventResponse)
@@ -44,7 +46,7 @@ parser = PydanticOutputParser(pydantic_object=EventResponse)
 # LangChain prompt template with format instructions
 event_extraction_template = """
 Extract the time based informations or events from the context and return a list of events with time,  event description and event sentiment type whether it was positive or negative event.
-The context may contain information about people, organization or any other entity. Try to get detailed and unique list of events as possible.
 <context>
 {context}
@@ -56,6 +58,8 @@ The response must follow the following schema strictly. There will be penalty fo
 {format_instructions}
 </schema>
 Output:
 """
@@ -67,14 +71,23 @@ event_prompt = PromptTemplate(
 # Function to get the appropriate language model based on user selection
 def getModel(model, key):
-    if(model == 'OpenAI'):
         os.environ['OPENAI_API_KEY'] = key
         return ChatOpenAI(temperature=0,  # Set to 0 for deterministic output
                     model="gpt-4o-2024-08-06",  # Using the GPT-4 Turbo model
                     max_tokens=8000)  # Limit the response length
-    else:
         os.environ['ANTHROPIC_API_KEY'] = key
         return ChatAnthropic(model='claude-3-5-sonnet-20240620')  # Limit the response length
 # Function to generate an HTML table from the summary object
@@ -96,11 +109,19 @@ def generate_timeline_html(timeline):
     for idx, tline in timeline.iterrows():
         if idx % 2 == 0:
             rows.append(Li(Div(File("./assets/circle.svg"), cls = "timeline-middle"),
-                        Div(Time(tline['TimeStr'], cls = "font-mono italic"), Div(tline['Event'], cls = 'text-lg font-black'), cls = "timeline-start mb-10 md:text-end"),
                         Hr()))
         else:
             rows.append(Li(Div(File("./assets/circle.svg"), cls = "timeline-middle"),
-                        Div(Time(tline['TimeStr'], cls = "font-mono italic"), Div(tline['Event'], cls = 'text-lg font-black'), cls = "timeline-end mb-10"),
                         Hr()))
     return  Ul(*rows, cls="timeline timeline-vertical")
@@ -139,16 +160,26 @@ def get_timeline_df(result):
     return df
 # Placeholder function for Q&A generation
-def generate_timeline(topic, llm):
     # This function will be implemented later
     # For now, return a sample DataFrame
-    wikipedia = WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper())
     wiki_content = wikipedia.run(topic)
     chain = event_prompt | llm | parser
-    result = chain.invoke({"context" : wiki_content})
     try:
         # Parse the output using PydanticOutputParser
@@ -178,7 +209,7 @@ def getConfigForm():
             ),
             Div(
                 Span(Strong('Model: '), cls ="badge"),
-                Select(Option("OpenAI"), Option("Anthropic"), id="model", cls = 'select w-full max-w-xs')
             ),
             Div(
                 Span(Strong('Topic for timeline (Person/Organization/Event): '), cls ="badge"),
@@ -191,6 +222,10 @@ def getConfigForm():
                       cls = "input w-full max-w-xs",
                       placeholder = "Type here")
             ),
             Div(
                 Button("Generate Timeline", cls = 'btn')
             ),
@@ -231,7 +266,9 @@ async def post(d:dict):
         model = getModel(d['model'], d['secret'])
         # Perform one-pass summarization
-        timeline_df = generate_timeline(d['topic'], model)
         #qas = pd.read_csv("results_tesla.csv")
         timeline_df.head(10)

 import json
 import pandas as pd
 import traceback
+import wikipedia
 from datetime import datetime
 from typing import Literal
 from pydantic_core import from_json
 from langchain_anthropic import ChatAnthropic
 from pydantic import BaseModel, Field, ValidationError
 from langchain_openai import ChatOpenAI
+from langchain_google_genai import ChatGoogleGenerativeAI
 from fasthtml.common import *
 from fasthtml.components import Svg
 from langchain_community.utilities.wikipedia import WikipediaAPIWrapper
     sentiment: Literal["Positive", "Negative"] = Field(..., description="Categorization of the event sentiment")
 class EventResponse(BaseModel):
+    events: List[Event] = Field(min_length=10, max_length=20, description="List of events extracted from the context")
 # Set up the Pydantic output parser
 parser = PydanticOutputParser(pydantic_object=EventResponse)
 # LangChain prompt template with format instructions
 event_extraction_template = """
 Extract the time based informations or events from the context and return a list of events with time,  event description and event sentiment type whether it was positive or negative event.
+The context may contain information about people, organization or any other entity.
 <context>
 {context}
 {format_instructions}
 </schema>
+Must ensure the event belongs to the topic {topic} and try to get at least {numevents} unique events possible from the context.
 Output:
 """
 # Function to get the appropriate language model based on user selection
 def getModel(model, key):
+    """Return the chat model for the label selected in the config form.
+
+    model: dropdown label; "OpenAI Gpt-4o" and "Anthropic Claude" pick their
+           providers, any other value selects Google Gemini.
+    key:   API key, exported via the chosen provider's environment variable.
+    """
+    # The form option reads "OpenAI Gpt-4o"; comparing against 'OpenAI Gpt-o'
+    # alone never matched, so OpenAI selections fell through to the Gemini
+    # branch with an OpenAI key. The old spelling stays accepted for callers
+    # that may still send it.
+    if model in ('OpenAI Gpt-4o', 'OpenAI Gpt-o'):
         os.environ['OPENAI_API_KEY'] = key
         return ChatOpenAI(temperature=0,  # Set to 0 for deterministic output
+                    model="gpt-4o-2024-08-06",  # Pinned GPT-4o snapshot
                     max_tokens=8000)  # Limit the response length
+    elif (model == 'Anthropic Claude'):
         os.environ['ANTHROPIC_API_KEY'] = key
+        return ChatAnthropic(model='claude-3-5-sonnet-20240620')  # No explicit response-length limit is set here
+    else:
+        os.environ['GOOGLE_API_KEY'] = key
+        return ChatGoogleGenerativeAI(
+            model="gemini-1.5-pro",
+            temperature=0,
+            max_tokens=8000,
+            max_retries=2,
+        )
 # Function to generate an HTML table from the summary object
     for idx, tline in timeline.iterrows():
         if idx % 2 == 0:
             rows.append(Li(Div(File("./assets/circle.svg"), cls = "timeline-middle"),
+                        Div(Time(tline['TimeStr'],
+                                 cls = "font-mono italic"),
+                            Div(tline['Event'],
+                                 cls = 'text-lg font-black'),
+                                 cls = "timeline-start mb-10 md:text-end"),
                         Hr()))
         else:
             rows.append(Li(Div(File("./assets/circle.svg"), cls = "timeline-middle"),
+                        Div(Time(tline['TimeStr'],
+                                 cls = "font-mono italic"),
+                             Div(tline['Event'],
+                                 cls = 'text-lg font-black'),
+                                 cls = "timeline-end mb-10"),
                         Hr()))
     return  Ul(*rows, cls="timeline timeline-vertical")
     return df
 # Placeholder function for Q&A generation
+def generate_timeline(topic, numevents, llm):
     # This function will be implemented later
     # For now, return a sample DataFrame
+#    titles = wikipedia.search(topic, results = 1)
+#    page = wikipedia.page(titles[0])
+#    wiki_content = page.content
+    wikipedia = WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper(top_k_results=1, doc_content_chars_max=5000))
     wiki_content = wikipedia.run(topic)
+    print(f"wiki_content: {wiki_content}")
+#    print(f"wiki_artifact: {wiki_artifact}")
     chain = event_prompt | llm | parser
+    result = chain.invoke({"context" : wiki_content,
+                           "topic": topic,
+                           "numevents": numevents})
     try:
         # Parse the output using PydanticOutputParser
             ),
             Div(
                 Span(Strong('Model: '), cls ="badge"),
+                Select(Option("OpenAI Gpt-4o"), Option("Anthropic Claude"), Option("Google Gemini"), id="model", cls = 'select w-full max-w-xs')
             ),
             Div(
                 Span(Strong('Topic for timeline (Person/Organization/Event): '), cls ="badge"),
                       cls = "input w-full max-w-xs",
                       placeholder = "Type here")
             ),
+            Div(
+                Span(Strong('How many events: '), cls ="badge"),
+                Select(Option("5"), Option("10"), Option("20"), Option("30"), id="numevents", cls = 'select w-full max-w-xs')
+            ),
             Div(
                 Button("Generate Timeline", cls = 'btn')
             ),
         model = getModel(d['model'], d['secret'])
         # Perform one-pass summarization
+        timeline_df = generate_timeline(d['topic'],
+                                        d['numevents'],
+                                        model)
         #qas = pd.read_csv("results_tesla.csv")
         timeline_df.head(10)

timeline.csv CHANGED Viewed

@@ -1,21 +1,16 @@
 ,index,Time,Event,Sentiment,TimeStr
-0,6,1999-01-01 00:00:00+00:00,Dhoni made his first-class debut for Bihar.,Positive,01/01/1999
-1,7,2004-12-23 00:00:00+00:00,Dhoni debuted for the Indian cricket team in an ODI.,Positive,23/12/2004
-2,0,2007-09-24 00:00:00+00:00,India won the 2007 ICC World Twenty20 under Dhoni's captaincy.,Positive,24/09/2007
-3,18,2008-01-01 00:00:00+00:00,Dhoni received the Major Dhyan Chand Khel Ratna Award.,Positive,01/01/2008
-4,8,2008-01-01 00:00:00+00:00,Dhoni became captain of the Indian cricket team in all formats.,Positive,01/01/2008
-5,11,2010-04-25 00:00:00+00:00,CSK won the IPL under Dhoni's captaincy.,Positive,25/04/2010
-6,3,2010-06-24 00:00:00+00:00,India won the Asia Cup in 2010 under Dhoni's captaincy.,Positive,24/06/2010
-7,16,2010-09-26 00:00:00+00:00,CSK won the Champions League T20 under Dhoni.,Positive,26/09/2010
-8,19,2011-01-01 00:00:00+00:00,Dhoni received honorary rank of Lieutenant Colonel.,Positive,01/01/2011
-9,1,2011-04-02 00:00:00+00:00,India won the 2011 Cricket World Cup under Dhoni's leadership.,Positive,02/04/2011
-10,12,2011-05-28 00:00:00+00:00,CSK won the IPL again with Dhoni as captain.,Positive,28/05/2011
-11,2,2013-06-23 00:00:00+00:00,India won the 2013 ICC Champions Trophy with Dhoni as captain.,Positive,23/06/2013
-12,17,2014-10-04 00:00:00+00:00,CSK won the Champions League T20 again with Dhoni.,Positive,04/10/2014
-13,9,2014-12-30 00:00:00+00:00,Dhoni retired from Test cricket.,Negative,30/12/2014
-14,4,2016-03-06 00:00:00+00:00,India won the Asia Cup in 2016 with Dhoni as captain.,Positive,06/03/2016
-15,13,2018-05-27 00:00:00+00:00,CSK won the IPL for the third time under Dhoni.,Positive,27/05/2018
-16,5,2018-09-28 00:00:00+00:00,Dhoni was part of the 2018 Asia Cup winning squad.,Positive,28/09/2018
-17,10,2019-07-10 00:00:00+00:00,Dhoni retired from international limited-overs cricket.,Negative,10/07/2019
-18,14,2021-10-15 00:00:00+00:00,CSK won the IPL for the fourth time with Dhoni.,Positive,15/10/2021
-19,15,2023-05-29 00:00:00+00:00,CSK won the IPL for the fifth time under Dhoni.,Positive,29/05/2023

 ,index,Time,Event,Sentiment,TimeStr
+0,0,1981-07-07 00:00:00+00:00,MS Dhoni is born,Positive,07/07/1981
+1,1,1999-01-01 00:00:00+00:00,Dhoni makes his first class debut for Bihar,Positive,01/01/1999
+2,2,2004-12-23 00:00:00+00:00,Dhoni makes his debut for the Indian cricket team in an ODI against Bangladesh,Positive,23/12/2004
+3,3,2005-12-01 00:00:00+00:00,Dhoni plays his first test match against Sri Lanka,Positive,01/12/2005
+4,4,2007-01-01 00:00:00+00:00,Dhoni becomes captain of the ODI side,Positive,01/01/2007
+5,5,2007-09-24 00:00:00+00:00,Dhoni leads India to victory in the ICC World Twenty20,Positive,24/09/2007
+6,6,2008-01-01 00:00:00+00:00,Dhoni takes over as captain in all formats of cricket,Positive,01/01/2008
+7,7,2008-01-01 00:00:00+00:00,Dhoni is awarded India's highest sport honor Major Dhyan Chand Khel Ratna Award,Positive,01/01/2008
+8,8,2009-01-01 00:00:00+00:00,"Dhoni receives the Padma Shri, India's fourth highest civilian award",Positive,01/01/2009
+9,10,2011-01-01 00:00:00+00:00,Dhoni is awarded honorary rank of Lieutenant Colonel in the Indian Territorial Army,Positive,01/01/2011
+10,9,2011-04-02 00:00:00+00:00,Dhoni leads India to victory in the Cricket World Cup,Positive,02/04/2011
+11,11,2013-06-23 00:00:00+00:00,Dhoni leads India to victory in the ICC Champions Trophy,Positive,23/06/2013
+12,12,2014-12-30 00:00:00+00:00,Dhoni retires from test cricket,Negative,30/12/2014
+13,13,2018-01-01 00:00:00+00:00,"Dhoni receives the Padma Bhushan, India's third highest civilian award",Positive,01/01/2018
+14,14,2019-12-31 00:00:00+00:00,Dhoni retires from limited overs international cricket,Negative,31/12/2019