| import re |
| import inspect |
| import requests |
| import pandas as pd |
| import yfinance as yf |
| import concurrent.futures |
|
|
| from typing import List |
| from bs4 import BeautifulSoup |
| from utils import inference_logger |
| from langchain.tools import tool |
| from langchain_core.utils.function_calling import convert_to_openai_tool |
|
|
| @tool |
| def google_search_and_scrape(query: str) -> dict: |
| """ |
| Performs a Google search for the given query, retrieves the top search result URLs, |
| and scrapes the text content and table data from those pages in parallel. |
| |
| Args: |
| query (str): The search query. |
| Returns: |
| list: A list of dictionaries containing the URL, text content, and table data for each scraped page. |
| """ |
| num_results = 2 |
| url = 'https://www.google.com/search' |
| params = {'q': query, 'num': num_results} |
| headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.61 Safari/537.3'} |
| |
| inference_logger.info(f"Performing google search with query: {query}\nplease wait...") |
| response = requests.get(url, params=params, headers=headers) |
| soup = BeautifulSoup(response.text, 'html.parser') |
| urls = [result.find('a')['href'] for result in soup.find_all('div', class_='tF2Cxc')] |
| |
| inference_logger.info(f"Scraping text from urls, please wait...") |
| [inference_logger.info(url) for url in urls] |
| with concurrent.futures.ThreadPoolExecutor(max_workers=5) as executor: |
| futures = [executor.submit(lambda url: (url, requests.get(url, headers=headers).text if isinstance(url, str) else None), url) for url in urls[:num_results] if isinstance(url, str)] |
| results = [] |
| for future in concurrent.futures.as_completed(futures): |
| url, html = future.result() |
| soup = BeautifulSoup(html, 'html.parser') |
| paragraphs = [p.text.strip() for p in soup.find_all('p') if p.text.strip()] |
| text_content = ' '.join(paragraphs) |
| text_content = re.sub(r'\s+', ' ', text_content) |
| table_data = [[cell.get_text(strip=True) for cell in row.find_all('td')] for table in soup.find_all('table') for row in table.find_all('tr')] |
| if text_content or table_data: |
| results.append({'url': url, 'content': text_content, 'tables': table_data}) |
| return results |
|
|
| @tool |
| def get_current_stock_price(symbol: str) -> float: |
| """ |
| Get the current stock price for a given symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| float: The current stock price, or None if an error occurs. |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| |
| current_price = stock.info.get("regularMarketPrice", stock.info.get("currentPrice")) |
| return current_price if current_price else None |
| except Exception as e: |
| print(f"Error fetching current price for {symbol}: {e}") |
| return None |
|
|
| @tool |
| def get_stock_fundamentals(symbol: str) -> dict: |
| """ |
| Get fundamental data for a given stock symbol using yfinance API. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| dict: A dictionary containing fundamental data. |
| Keys: |
| - 'symbol': The stock symbol. |
| - 'company_name': The long name of the company. |
| - 'sector': The sector to which the company belongs. |
| - 'industry': The industry to which the company belongs. |
| - 'market_cap': The market capitalization of the company. |
| - 'pe_ratio': The forward price-to-earnings ratio. |
| - 'pb_ratio': The price-to-book ratio. |
| - 'dividend_yield': The dividend yield. |
| - 'eps': The trailing earnings per share. |
| - 'beta': The beta value of the stock. |
| - '52_week_high': The 52-week high price of the stock. |
| - '52_week_low': The 52-week low price of the stock. |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| info = stock.info |
| fundamentals = { |
| 'symbol': symbol, |
| 'company_name': info.get('longName', ''), |
| 'sector': info.get('sector', ''), |
| 'industry': info.get('industry', ''), |
| 'market_cap': info.get('marketCap', None), |
| 'pe_ratio': info.get('forwardPE', None), |
| 'pb_ratio': info.get('priceToBook', None), |
| 'dividend_yield': info.get('dividendYield', None), |
| 'eps': info.get('trailingEps', None), |
| 'beta': info.get('beta', None), |
| '52_week_high': info.get('fiftyTwoWeekHigh', None), |
| '52_week_low': info.get('fiftyTwoWeekLow', None) |
| } |
| return fundamentals |
| except Exception as e: |
| print(f"Error getting fundamentals for {symbol}: {e}") |
| return {} |
|
|
| @tool |
| def get_financial_statements(symbol: str) -> dict: |
| """ |
| Get financial statements for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| dict: Dictionary containing financial statements (income statement, balance sheet, cash flow statement). |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| financials = stock.financials |
| return financials |
| except Exception as e: |
| print(f"Error fetching financial statements for {symbol}: {e}") |
| return {} |
|
|
| @tool |
| def get_key_financial_ratios(symbol: str) -> dict: |
| """ |
| Get key financial ratios for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| dict: Dictionary containing key financial ratios. |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| key_ratios = stock.info |
| return key_ratios |
| except Exception as e: |
| print(f"Error fetching key financial ratios for {symbol}: {e}") |
| return {} |
|
|
| @tool |
| def get_analyst_recommendations(symbol: str) -> pd.DataFrame: |
| """ |
| Get analyst recommendations for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| pd.DataFrame: DataFrame containing analyst recommendations. |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| recommendations = stock.recommendations |
| return recommendations |
| except Exception as e: |
| print(f"Error fetching analyst recommendations for {symbol}: {e}") |
| return pd.DataFrame() |
|
|
| @tool |
| def get_dividend_data(symbol: str) -> pd.DataFrame: |
| """ |
| Get dividend data for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| pd.DataFrame: DataFrame containing dividend data. |
| """ |
| try: |
| stock = yf.Ticker(symbol) |
| dividends = stock.dividends |
| return dividends |
| except Exception as e: |
| print(f"Error fetching dividend data for {symbol}: {e}") |
| return pd.DataFrame() |
|
|
| @tool |
| def get_company_news(symbol: str) -> pd.DataFrame: |
| """ |
| Get company news and press releases for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| pd.DataFrame: DataFrame containing company news and press releases. |
| """ |
| try: |
| news = yf.Ticker(symbol).news |
| return news |
| except Exception as e: |
| print(f"Error fetching company news for {symbol}: {e}") |
| return pd.DataFrame() |
|
|
| @tool |
| def get_technical_indicators(symbol: str) -> pd.DataFrame: |
| """ |
| Get technical indicators for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| pd.DataFrame: DataFrame containing technical indicators. |
| """ |
| try: |
| indicators = yf.Ticker(symbol).history(period="max") |
| return indicators |
| except Exception as e: |
| print(f"Error fetching technical indicators for {symbol}: {e}") |
| return pd.DataFrame() |
|
|
| @tool |
| def get_company_profile(symbol: str) -> dict: |
| """ |
| Get company profile and overview for a given stock symbol. |
| |
| Args: |
| symbol (str): The stock symbol. |
| |
| Returns: |
| dict: Dictionary containing company profile and overview. |
| """ |
| try: |
| profile = yf.Ticker(symbol).info |
| return profile |
| except Exception as e: |
| print(f"Error fetching company profile for {symbol}: {e}") |
| return {} |
|
|
| def get_openai_tools() -> List[dict]: |
| functions = [ |
| google_search_and_scrape, |
| get_current_stock_price, |
| get_company_news, |
| get_company_profile, |
| get_stock_fundamentals, |
| get_financial_statements, |
| get_key_financial_ratios, |
| get_analyst_recommendations, |
| get_dividend_data, |
| get_technical_indicators |
| ] |
|
|
| tools = [convert_to_openai_tool(f) for f in functions] |
| return tools |
|
|