Spaces:

jsolow
/

YFDashboard

Sleeping

Jon Solow committed on Sep 20, 2023

Commit

958ade1

1 Parent(s): c412d07

Add fix for players with no team in player news

Files changed (1) hide show

src/queries/nbcsports/player_news.py CHANGED Viewed

@@ -14,12 +14,19 @@ def get_text_from_find_all(soup, element: str, find_search_map: Mapping[str, str
     return text_list
 def get_nfl_player_news(page_number: int = 1) -> pd.DataFrame:
     url = f"{NEWS_URL}?p={page_number}"
     request_page = requests.get(url)
     soup = BeautifulSoup(request_page.content)
     player_names_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-name"})
-    team_abbr_list = get_text_from_find_all(soup, "span", {"class": "PlayerNewsPost-team-abbr"})
     position_list = get_text_from_find_all(soup, "span", {"class": "PlayerNewsPost-position"})
     headline_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-headline"})
     analysis_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-analysis"})

     return text_list
+def get_team_names(soup):
+    player_team_div_list = soup.find_all("div", "PlayerNewsPost-team")
+    player_team_abbr_span_list = [x.find("span", {"class": "PlayerNewsPost-team-abbr"}) for x in player_team_div_list]
+    player_team_abbr_list = [x.text.upper() if x else "" for x in player_team_abbr_span_list]
+    return player_team_abbr_list
 def get_nfl_player_news(page_number: int = 1) -> pd.DataFrame:
     url = f"{NEWS_URL}?p={page_number}"
     request_page = requests.get(url)
     soup = BeautifulSoup(request_page.content)
     player_names_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-name"})
+    team_abbr_list = get_team_names(soup)
     position_list = get_text_from_find_all(soup, "span", {"class": "PlayerNewsPost-position"})
     headline_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-headline"})
     analysis_list = get_text_from_find_all(soup, "div", {"class": "PlayerNewsPost-analysis"})