Spaces:
Runtime error
Runtime error
Update embedding model configuration and simplify tool initialization in `tools.py`
Browse files
src/gaia_solving_agent/tools.py
CHANGED
|
@@ -1,3 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
| 1 |
from llama_index.core.schema import ImageDocument, Document
|
| 2 |
from llama_index.core.tools import FunctionTool
|
| 3 |
from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
|
|
@@ -15,7 +18,9 @@ from workflows import Context
|
|
| 15 |
|
| 16 |
from gaia_solving_agent import TAVILY_API_KEY, NEBIUS_API_KEY, MISTRAL_API_KEY, OPENAI_API_KEY
|
| 17 |
|
|
|
|
| 18 |
embedding_model = "text-embedding-3-small"
|
|
|
|
| 19 |
|
| 20 |
|
| 21 |
def load_and_search_tools_from_toolspec(tool_spec: BaseToolSpec, **kwargs) -> list[FunctionTool]:
|
|
@@ -161,7 +166,6 @@ async def vllm_ask_image(query: str, images: ImageDocument | list[ImageDocument]
|
|
| 161 |
|
| 162 |
simple_web_page_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 163 |
SimpleWebPageReader(html_to_text=True),
|
| 164 |
-
index_kwargs={"embed_model": embedding_model},
|
| 165 |
name="simple_web_page_reader_tool",
|
| 166 |
description="""
|
| 167 |
Tool for loading content from a web page and return it as text.
|
|
@@ -179,12 +183,10 @@ Do not use this tool for:
|
|
| 179 |
)
|
| 180 |
simple_web_page_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 181 |
simple_web_page_reader_tool,
|
| 182 |
-
index_kwargs={"embed_model": embedding_model},
|
| 183 |
)
|
| 184 |
|
| 185 |
youtube_transcript_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 186 |
YoutubeTranscriptReader(),
|
| 187 |
-
index_kwargs={"embed_model": embedding_model},
|
| 188 |
name="youtube_transcript_reader_tool",
|
| 189 |
description=r"""
|
| 190 |
Tool for loading the audio transcript from a youtube video and return it as text.
|
|
@@ -200,13 +202,11 @@ If you are provided with a youtube link in the wrong format, make it fit one the
|
|
| 200 |
)
|
| 201 |
youtube_transcript_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 202 |
youtube_transcript_reader_tool,
|
| 203 |
-
index_kwargs={"embed_model": embedding_model},
|
| 204 |
)
|
| 205 |
|
| 206 |
|
| 207 |
research_paper_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 208 |
ArxivReader(),
|
| 209 |
-
index_kwargs={"embed_model": embedding_model},
|
| 210 |
name="research_paper_reader_tool",
|
| 211 |
description=r"""
|
| 212 |
Gets a search query, return a list of Documents of the top corresponding scientific papers on Arxiv.
|
|
@@ -214,10 +214,8 @@ Gets a search query, return a list of Documents of the top corresponding scienti
|
|
| 214 |
)
|
| 215 |
research_paper_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 216 |
research_paper_reader_tool,
|
| 217 |
-
index_kwargs={"embed_model": embedding_model},
|
| 218 |
)
|
| 219 |
|
| 220 |
wikipedia_toolspec = load_and_search_tools_from_toolspec(
|
| 221 |
WikipediaToolSpec(),
|
| 222 |
-
index_kwargs={"embed_model": embedding_model},
|
| 223 |
)
|
|
|
|
| 1 |
+
from llama_index.core import Settings
|
| 2 |
+
from llama_index.embeddings.openai import OpenAIEmbedding
|
| 3 |
+
|
| 4 |
from llama_index.core.schema import ImageDocument, Document
|
| 5 |
from llama_index.core.tools import FunctionTool
|
| 6 |
from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
|
|
|
|
| 18 |
|
| 19 |
from gaia_solving_agent import TAVILY_API_KEY, NEBIUS_API_KEY, MISTRAL_API_KEY, OPENAI_API_KEY
|
| 20 |
|
| 21 |
+
# changing the global default
|
| 22 |
embedding_model = "text-embedding-3-small"
|
| 23 |
+
Settings.embed_model = OpenAIEmbedding(model=embedding_model, api_key=OPENAI_API_KEY)
|
| 24 |
|
| 25 |
|
| 26 |
def load_and_search_tools_from_toolspec(tool_spec: BaseToolSpec, **kwargs) -> list[FunctionTool]:
|
|
|
|
| 166 |
|
| 167 |
simple_web_page_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 168 |
SimpleWebPageReader(html_to_text=True),
|
|
|
|
| 169 |
name="simple_web_page_reader_tool",
|
| 170 |
description="""
|
| 171 |
Tool for loading content from a web page and return it as text.
|
|
|
|
| 183 |
)
|
| 184 |
simple_web_page_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 185 |
simple_web_page_reader_tool,
|
|
|
|
| 186 |
)
|
| 187 |
|
| 188 |
youtube_transcript_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 189 |
YoutubeTranscriptReader(),
|
|
|
|
| 190 |
name="youtube_transcript_reader_tool",
|
| 191 |
description=r"""
|
| 192 |
Tool for loading the audio transcript from a youtube video and return it as text.
|
|
|
|
| 202 |
)
|
| 203 |
youtube_transcript_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 204 |
youtube_transcript_reader_tool,
|
|
|
|
| 205 |
)
|
| 206 |
|
| 207 |
|
| 208 |
research_paper_reader_tool = OnDemandLoaderTool.from_defaults(
|
| 209 |
ArxivReader(),
|
|
|
|
| 210 |
name="research_paper_reader_tool",
|
| 211 |
description=r"""
|
| 212 |
Gets a search query, return a list of Documents of the top corresponding scientific papers on Arxiv.
|
|
|
|
| 214 |
)
|
| 215 |
research_paper_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
|
| 216 |
research_paper_reader_tool,
|
|
|
|
| 217 |
)
|
| 218 |
|
| 219 |
wikipedia_toolspec = load_and_search_tools_from_toolspec(
|
| 220 |
WikipediaToolSpec(),
|
|
|
|
| 221 |
)
|