lwant commited on
Commit
5e9156a
Β·
1 Parent(s): 37c6430

Update embedding model configuration and simplify tool initialization in `tools.py`

Browse files
Files changed (1) hide show
  1. src/gaia_solving_agent/tools.py +5 -7
src/gaia_solving_agent/tools.py CHANGED
@@ -1,3 +1,6 @@
 
 
 
1
  from llama_index.core.schema import ImageDocument, Document
2
  from llama_index.core.tools import FunctionTool
3
  from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
@@ -15,7 +18,9 @@ from workflows import Context
15
 
16
  from gaia_solving_agent import TAVILY_API_KEY, NEBIUS_API_KEY, MISTRAL_API_KEY, OPENAI_API_KEY
17
 
 
18
  embedding_model = "text-embedding-3-small"
 
19
 
20
 
21
  def load_and_search_tools_from_toolspec(tool_spec: BaseToolSpec, **kwargs) -> list[FunctionTool]:
@@ -161,7 +166,6 @@ async def vllm_ask_image(query: str, images: ImageDocument | list[ImageDocument]
161
 
162
  simple_web_page_reader_tool = OnDemandLoaderTool.from_defaults(
163
  SimpleWebPageReader(html_to_text=True),
164
- index_kwargs={"embed_model": embedding_model},
165
  name="simple_web_page_reader_tool",
166
  description="""
167
  Tool for loading content from a web page and return it as text.
@@ -179,12 +183,10 @@ Do not use this tool for:
179
  )
180
  simple_web_page_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
181
  simple_web_page_reader_tool,
182
- index_kwargs={"embed_model": embedding_model},
183
  )
184
 
185
  youtube_transcript_reader_tool = OnDemandLoaderTool.from_defaults(
186
  YoutubeTranscriptReader(),
187
- index_kwargs={"embed_model": embedding_model},
188
  name="youtube_transcript_reader_tool",
189
  description=r"""
190
  Tool for loading the audio transcript from a youtube video and return it as text.
@@ -200,13 +202,11 @@ If you are provided with a youtube link in the wrong format, make it fit one the
200
  )
201
  youtube_transcript_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
202
  youtube_transcript_reader_tool,
203
- index_kwargs={"embed_model": embedding_model},
204
  )
205
 
206
 
207
  research_paper_reader_tool = OnDemandLoaderTool.from_defaults(
208
  ArxivReader(),
209
- index_kwargs={"embed_model": embedding_model},
210
  name="research_paper_reader_tool",
211
  description=r"""
212
  Gets a search query, return a list of Documents of the top corresponding scientific papers on Arxiv.
@@ -214,10 +214,8 @@ Gets a search query, return a list of Documents of the top corresponding scienti
214
  )
215
  research_paper_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
216
  research_paper_reader_tool,
217
- index_kwargs={"embed_model": embedding_model},
218
  )
219
 
220
  wikipedia_toolspec = load_and_search_tools_from_toolspec(
221
  WikipediaToolSpec(),
222
- index_kwargs={"embed_model": embedding_model},
223
  )
 
1
+ from llama_index.core import Settings
2
+ from llama_index.embeddings.openai import OpenAIEmbedding
3
+
4
  from llama_index.core.schema import ImageDocument, Document
5
  from llama_index.core.tools import FunctionTool
6
  from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
 
18
 
19
  from gaia_solving_agent import TAVILY_API_KEY, NEBIUS_API_KEY, MISTRAL_API_KEY, OPENAI_API_KEY
20
 
21
+ # changing the global default
22
  embedding_model = "text-embedding-3-small"
23
+ Settings.embed_model = OpenAIEmbedding(model=embedding_model, api_key=OPENAI_API_KEY)
24
 
25
 
26
  def load_and_search_tools_from_toolspec(tool_spec: BaseToolSpec, **kwargs) -> list[FunctionTool]:
 
166
 
167
  simple_web_page_reader_tool = OnDemandLoaderTool.from_defaults(
168
  SimpleWebPageReader(html_to_text=True),
 
169
  name="simple_web_page_reader_tool",
170
  description="""
171
  Tool for loading content from a web page and return it as text.
 
183
  )
184
  simple_web_page_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
185
  simple_web_page_reader_tool,
 
186
  )
187
 
188
  youtube_transcript_reader_tool = OnDemandLoaderTool.from_defaults(
189
  YoutubeTranscriptReader(),
 
190
  name="youtube_transcript_reader_tool",
191
  description=r"""
192
  Tool for loading the audio transcript from a youtube video and return it as text.
 
202
  )
203
  youtube_transcript_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
204
  youtube_transcript_reader_tool,
 
205
  )
206
 
207
 
208
  research_paper_reader_tool = OnDemandLoaderTool.from_defaults(
209
  ArxivReader(),
 
210
  name="research_paper_reader_tool",
211
  description=r"""
212
  Gets a search query, return a list of Documents of the top corresponding scientific papers on Arxiv.
 
214
  )
215
  research_paper_reader_toolspec = LoadAndSearchToolSpec.from_defaults(
216
  research_paper_reader_tool,
 
217
  )
218
 
219
  wikipedia_toolspec = load_and_search_tools_from_toolspec(
220
  WikipediaToolSpec(),
 
221
  )