Spaces:

Multichem
/

NHL_Macro_Sheets

Running

James McCool

Add .gitignore and refactor app.py and database.py for improved secret management

9330cee 6 days ago

5.9 kB

	import streamlit as st
	# Configure the page for the wide layout before any other Streamlit call is made.
	st.set_page_config(layout="wide")

	# Drop every public (non-underscore) module-level name. `dir()` is evaluated once,
	# so the namespace can be mutated safely while looping over that snapshot.
	# This also removes `st`, which is why streamlit is imported again right after.
	for name in dir():
		if name.startswith('_'):
			continue
		del globals()[name]

	import re

	import gspread
	import numpy as np
	import pandas as pd
	import streamlit as st

	from database import gcservice_account, NHL_data


	# Styler format maps: every listed column is rendered as a percentage with two decimals.
	percentages_format = {
		column: '{:.2%}'
		for column in (
			'Shots', 'HDCF', 'Goals', 'Assists', 'Blocks',
			'L14_Shots', 'L14_HDCF', 'L14_Goals', 'L14_Assists', 'L14_Blocks',
			'Max Goal%', 'L14 Max Goal%',
		)
	}

	# Same percentage format for the rate columns of the matchups table.
	matchups_format = {column: '{:.2%}' for column in ('HDCF%', 'o_HDCA%', 'HDCF_m%')}

	def _read_sheet(sh, title, require_opp=False):
		"""Return worksheet *title* of spreadsheet *sh* as a DataFrame.

		The first row of the sheet becomes the column header and is removed from
		the data; the index is renumbered from zero. When *require_opp* is true,
		rows whose 'Opp' cell is an empty string are dropped.
		"""
		frame = pd.DataFrame(sh.worksheet(title).get_values())
		frame.columns = frame.iloc[0]
		frame = frame[1:].reset_index(drop=True)
		if require_opp:
			frame = frame[frame['Opp'] != ""]
		return frame


	# cache_data (not cache_resource): the function returns plain data objects, and
	# st.cache_data.clear() then invalidates this cache as well.
	@st.cache_data(ttl=599)
	def init_baselines():
		"""Load the matchup and line-marketshare tables from the NHL spreadsheet.

		Reads the 'Player_Level_ROO', 'Matchups' and 'Marketshares' worksheets of
		the spreadsheet at ``NHL_data``. The result is cached for 599 seconds.

		Returns:
			A tuple ``(matchups, overall_ms, team_frame, team_list, team_dict)``:

			* matchups -- per-team matchup table, numeric apart from 'Team' and
			  'Opp', without rows lacking 'HDSF+', sorted by 'HDCF_m' descending.
			* overall_ms -- per-line marketshare table with the derived
			  'Max Goal%', 'Proj Goal', 'L14 Max Goal%' and 'L14 Proj Goal'
			  columns, sorted by 'Shots' descending.
			* team_frame -- the 'Team'/'Opp' columns of 'Player_Level_ROO'.
			* team_list -- unique 'Team' values of team_frame.
			* team_dict -- mapping of 'Team' to 'Opp' (last row wins on repeats).
		"""
		matchup_cols = ['Team', 'Opp', 'FL1$', 'FL2$', 'FL3$', 'Team Total', 'Game Pace', 'SF', 'o_SA', 'SF_m', 'HDCF',
			'o_HDCA', 'HDCF_m', 'HDCF%', 'o_HDCA%', 'HDCF_m%', 'HDSF+']
		marketshare_cols = ['Line', 'SK1', 'SK2', 'SK3', 'Cost', 'Team Total', 'Shots', 'HDCF', 'Goals', 'Assists', 'Blocks',
			'L14_Shots', 'L14_HDCF', 'L14_Goals', 'L14_Assists', 'L14_Blocks']
		marketshare_order = ['Line', 'SK1', 'SK2', 'SK3', 'Cost', 'Team Total', 'Shots', 'HDCF', 'Goals', 'Max Goal%', 'Proj Goal',
			'Assists', 'Blocks', 'L14_Shots', 'L14_HDCF', 'L14_Goals', 'L14 Max Goal%', 'L14 Proj Goal', 'L14_Assists', 'L14_Blocks']

		sh = gcservice_account.open_by_url(NHL_data)

		# Teams on the slate and their opponents.
		team_frame = _read_sheet(sh, 'Player_Level_ROO', require_opp=True)[['Team', 'Opp']]
		team_list = team_frame['Team'].unique()
		team_dict = dict(zip(team_frame['Team'], team_frame['Opp']))

		# Matchups: .copy() so the numeric conversion below writes to an independent
		# frame rather than to a slice of the raw sheet data.
		matchups = _read_sheet(sh, 'Matchups', require_opp=True)[matchup_cols].copy()
		data_cols = matchups.columns.drop(['Team', 'Opp'])
		matchups[data_cols] = matchups[data_cols].apply(pd.to_numeric, errors='coerce')
		matchups = matchups.dropna(subset=['HDSF+'])
		matchups = matchups.sort_values(by='HDCF_m', ascending=False)

		# Marketshares: convert to numbers first so the per-team maxima below are
		# numeric maxima, not lexicographic maxima of the raw cell strings.
		overall_ms = _read_sheet(sh, 'Marketshares')[marketshare_cols].copy()
		data_cols = overall_ms.columns.drop(['Line', 'SK1', 'SK2', 'SK3'])
		overall_ms[data_cols] = overall_ms[data_cols].apply(pd.to_numeric, errors='coerce')

		# Alternation of the team names. The separator must be a bare '|': an escaped
		# pipe would only match a literal '|' character. Names are escaped so regex
		# metacharacters inside a team name are matched literally.
		pat = '|'.join(re.escape(str(team)) for team in team_list)
		line_team = overall_ms['Line'].str.extract('(' + pat + ')', expand=False)
		overall_ms['Max Goal%'] = overall_ms.groupby(line_team)['Goals'].transform('max')
		overall_ms['L14 Max Goal%'] = overall_ms.groupby(line_team)['L14_Goals'].transform('max')

		overall_ms['Proj Goal'] = overall_ms['Goals'] * overall_ms['Team Total']
		overall_ms['L14 Proj Goal'] = overall_ms['L14_Goals'] * overall_ms['Team Total']
		overall_ms = overall_ms[marketshare_order]
		overall_ms = overall_ms.sort_values(by='Shots', ascending=False)

		return matchups, overall_ms, team_frame, team_list, team_dict

	def convert_df_to_csv(df):
		"""Serialize *df* to CSV text (index included) and return it as UTF-8 bytes."""
		csv_text = df.to_csv()
		return bytes(csv_text, 'utf-8')

	# Initial (cached) load of every table the page needs.
	matchups, overall_ms, team_frame, team_list, team_dict = init_baselines()

	# Narrow control column on the left, wide table column on the right.
	col1, col2 = st.columns([1, 9])
	with col1:
		if st.button("Reset Data", key='reset1'):
			# Clear the loader's own cache. The function-level clear() works whichever
			# Streamlit cache decorator wraps init_baselines, so the reload below
			# really re-reads the spreadsheet.
			init_baselines.clear()
			matchups, overall_ms, team_frame, team_list, team_dict = init_baselines()
		split_var1 = st.radio("View matchups or line marketshares?", ('Slate Matchups', 'Line Marketshares'), key='split_var1')
		if split_var1 == "Line Marketshares":
			team_var = st.radio("View all teams or specific teams?", ('All Teams', 'Specific Teams'), key='team_var')
			if team_var == "All Teams":
				# One entry per team is enough for the filter pattern built below.
				team_split = team_frame['Team'].unique().tolist()
			elif team_var == "Specific Teams":
				team_split = st.multiselect('Which teams would you like to include in the tables?', options = team_frame['Team'].unique(), key='team_var1')

	# NOTE(review): the export buttons are rendered in the table column, directly
	# under the table they export -- confirm this is the intended placement.
	with col2:
		if split_var1 == 'Slate Matchups':
			display_table = matchups.set_index('Team')
			st.dataframe(display_table.style.background_gradient(axis=0).background_gradient(cmap='RdYlGn').format(matchups_format, precision=2), height=500, use_container_width = True)
			st.download_button(
				label="Export Matchups (CSV)",
				data=convert_df_to_csv(display_table),
				file_name='Matchups_export.csv',
				mime='text/csv',
			)
		elif split_var1 == 'Line Marketshares':
			display_table = overall_ms
			# Regex alternation of the selected teams. The separator must be a bare
			# '|' (an escaped pipe matches only a literal '|'), and each name is
			# escaped so it is matched literally. An empty selection gives an empty
			# pattern, which matches every line.
			team_pattern = '|'.join(re.escape(str(team)) for team in team_split)
			display_parsed = display_table[display_table['Line'].str.contains(team_pattern, na=False)]
			st.dataframe(display_parsed.style.background_gradient(axis=0).background_gradient(cmap='RdYlGn').format(percentages_format, precision=2), height=500, use_container_width = True)
			# NOTE(review): the export contains the unfiltered marketshare table,
			# not only the teams shown above -- confirm that this is intended.
			st.download_button(
				label="Export Marketshares (CSV)",
				data=convert_df_to_csv(display_table),
				file_name='Marketshares_export.csv',
				mime='text/csv',
			)