import re import inspect import requests import pandas as pd import yfinance as yf import concurrent.futures from datetime import datetime from typing import List from bs4 import BeautifulSoup from logger import logger from langchain.tools import tool from langchain_core.utils.function_calling import convert_to_openai_tool from config import config from azure.core.credentials import AzureKeyCredential from azure.search.documents import SearchClient az_creds = AzureKeyCredential(config.az_search_api_key) az_search_client = SearchClient(config.az_search_endpoint, config.az_search_idx_name, az_creds) @tool def get_analysis(query: str) -> dict: """ Full text search through your database of company and crypto analysis, retrieves top 4 pieces of analysis relevant to your query. You MUST ALWAYS use this function to help form your opinions and predictions. Args: query (str): The search query Returns: list: A list of dictionaries containing the pieces of analysis. """ results = az_search_client.search( query_type="semantic", search_text=query, select="title,content,asset_name,write_date", include_total_count=True, top=config.az_search_top_k, semantic_configuration_name="basic-keywords", vector_queries=None, # Docs are too semantically similar, disable for now ) output = [] for x in results: if x["@search.score"] >= config.az_search_min_score: output.append({ "security": x["asset_name"], "date written": datetime.strptime(x["write_date"], "%Y%m%d").date(), "title": x["title"], "content": x["content"] }) return output @tool def google_search_and_scrape(query: str) -> dict: """ Performs a Google search for the given query, retrieves the top search result URLs, and scrapes the text content and table data from those pages in parallel. Args: query (str): The search query. Returns: list: A list of dictionaries containing the URL, text content, and table data for each scraped page. """ num_results = 2 url = 'https://www.google.com/search' params = {'q': query, 'num': num_results} headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/94.0.4606.61 Safari/537.3'} logger.info(f"Performing google search with query: {query}\nplease wait...") response = requests.get(url, params=params, headers=headers) soup = BeautifulSoup(response.text, 'html.parser') urls = [result.find('a')['href'] for result in soup.find_all('div', class_='tF2Cxc')] logger.info(f"Scraping text from urls, please wait...") [logger.info(url) for url in urls] with concurrent.futures.ThreadPoolExecutor(max_workers=5) as executor: futures = [executor.submit(lambda url: (url, requests.get(url, headers=headers).text if isinstance(url, str) else None), url) for url in urls[:num_results] if isinstance(url, str)] results = [] for future in concurrent.futures.as_completed(futures): url, html = future.result() soup = BeautifulSoup(html, 'html.parser') paragraphs = [p.text.strip() for p in soup.find_all('p') if p.text.strip()] text_content = ' '.join(paragraphs) text_content = re.sub(r'\s+', ' ', text_content) table_data = [[cell.get_text(strip=True) for cell in row.find_all('td')] for table in soup.find_all('table') for row in table.find_all('tr')] if text_content or table_data: results.append({'url': url, 'content': text_content, 'tables': table_data}) return results @tool def get_current_stock_price(symbol: str) -> float: """ Get the current stock price for a given symbol. Args: symbol (str): The stock symbol. Returns: float: The current stock price, or None if an error occurs. """ try: config.status.update(label=":chart_with_upwards_trend: Getting price") stock = yf.Ticker(symbol) # Use "regularMarketPrice" for regular market hours, or "currentPrice" for pre/post market current_price = stock.info.get("regularMarketPrice", stock.info.get("currentPrice")) return current_price if current_price else None except Exception as e: print(f"Error fetching current price for {symbol}: {e}") return None @tool def get_stock_fundamentals(symbol: str) -> dict: """ Get fundamental data for a given stock symbol using yfinance API. Args: symbol (str): The stock symbol. Returns: dict: A dictionary containing fundamental data. Keys: - 'symbol': The stock symbol. - 'company_name': The long name of the company. - 'sector': The sector to which the company belongs. - 'industry': The industry to which the company belongs. - 'market_cap': The market capitalization of the company. - 'pe_ratio': The forward price-to-earnings ratio. - 'pb_ratio': The price-to-book ratio. - 'dividend_yield': The dividend yield. - 'eps': The trailing earnings per share. - 'beta': The beta value of the stock. - '52_week_high': The 52-week high price of the stock. - '52_week_low': The 52-week low price of the stock. """ try: stock = yf.Ticker(symbol) info = stock.info fundamentals = { 'symbol': symbol, 'company_name': info.get('longName', ''), 'sector': info.get('sector', ''), 'industry': info.get('industry', ''), 'market_cap': info.get('marketCap', None), 'pe_ratio': info.get('forwardPE', None), 'pb_ratio': info.get('priceToBook', None), 'dividend_yield': info.get('dividendYield', None), 'eps': info.get('trailingEps', None), 'beta': info.get('beta', None), '52_week_high': info.get('fiftyTwoWeekHigh', None), '52_week_low': info.get('fiftyTwoWeekLow', None) } return fundamentals except Exception as e: print(f"Error getting fundamentals for {symbol}: {e}") return {} @tool def get_financial_statements(symbol: str) -> dict: """ Get financial statements for a given stock symbol. Args: symbol (str): The stock symbol. Returns: dict: Dictionary containing financial statements (income statement, balance sheet, cash flow statement). """ try: stock = yf.Ticker(symbol) financials = stock.financials return financials except Exception as e: print(f"Error fetching financial statements for {symbol}: {e}") return {} @tool def get_key_financial_ratios(symbol: str) -> dict: """ Get key financial ratios for a given stock symbol. Args: symbol (str): The stock symbol. Returns: dict: Dictionary containing key financial ratios. """ try: config.status.update(label=":chart_with_upwards_trend: Gathering financial data") stock = yf.Ticker(symbol) key_ratios = stock.info return key_ratios except Exception as e: print(f"Error fetching key financial ratios for {symbol}: {e}") return {} @tool def get_dividend_data(symbol: str) -> pd.DataFrame: """ Get dividend data for a given stock symbol. Args: symbol (str): The stock symbol. Returns: pd.DataFrame: DataFrame containing dividend data. """ try: stock = yf.Ticker(symbol) dividends = stock.dividends return dividends except Exception as e: print(f"Error fetching dividend data for {symbol}: {e}") return pd.DataFrame() @tool def get_company_news(symbol: str) -> pd.DataFrame: """ Get company news and press releases for a given stock symbol. Args: symbol (str): The stock symbol. Returns: pd.DataFrame: DataFrame containing company news and press releases. """ config.status.update(label=":newspaper: Getting news") try: news = yf.Ticker(symbol).news return news except Exception as e: print(f"Error fetching company news for {symbol}: {e}") return pd.DataFrame() @tool def get_technical_indicators(symbol: str) -> pd.DataFrame: """ Get technical indicators for a given stock symbol. Args: symbol (str): The stock symbol. Returns: pd.DataFrame: DataFrame containing technical indicators. """ try: indicators = yf.Ticker(symbol).history(period="max") return indicators except Exception as e: print(f"Error fetching technical indicators for {symbol}: {e}") return pd.DataFrame() @tool def get_company_profile(symbol: str) -> dict: """ Get company profile and overview for a given stock symbol. Args: symbol (str): The stock symbol. Returns: dict: Dictionary containing company profile and overview. """ try: profile = yf.Ticker(symbol).info return profile except Exception as e: print(f"Error fetching company profile for {symbol}: {e}") return {} def get_openai_tools() -> List[dict]: functions = [ get_analysis, # google_search_and_scrape, get_current_stock_price, get_company_news, # get_company_profile, # get_stock_fundamentals, # get_financial_statements, get_key_financial_ratios, # get_analyst_recommendations, # get_dividend_data, # get_technical_indicators ] tools = [convert_to_openai_tool(f) for f in functions] return tools