Systematic Equity Selection From Earnings Data Analysis¶

FINM 33150 - Quantitative Trading Strategies¶

REDACTED, REDACTED, Jared Szajkowski (REDACTED)¶

Abstract¶

The final project seeks to develop a systematic trading/investment strategy that takes advantage of several time-tested market ideas: the market tends to increase in price/value over time, positive earnings growth tends to increase company valuation, and companies with positive earnings growth tend to exhibit upward price momentum. Conversely, when companies have lower earnings they tend to have lower valuations, which provides an opportunity for the value factor to take effect.

Introduction / Goals¶

The basic goals for the trading strategy are as follows:

1. Identify the investment universe

To establish the universe of available equities, we will use the following criteria:

  • Restrict equities to companies with a market cap greater than $ 10 billion
  • Equities must be publicly traded on U.S. exchanges
  • Restrict equities to companies that have positive earnings per share (EPS)

2. Generate excess returns

Based upon the idea that companies experiencing earnings growth will subsequently increase in valuation, we will implement the following quantitative process:

  • Identify companies with earnings growth on a year over year time-frame

3. Capture outlier growth

We will also seek to identify equities that are experiencing outsized growth (so-called "outliers"), by implementing the following ideas:

  • Identify, on an annual basis, the 50 companies with the largest year over year percentage increase in earnings

4. Systematic risk management

The strategy will employ disciplined systematic risk management to perform the following:

  • Implement a trailing stop style stop-loss strategy for a maximum loss of 10% on any given position
  • Equal weight initial position sizing (see the sizing sketch after this list)
  • Reset position sizing annually when the portfolio turns over
  • Gains are harvested and moved off book (but analyzed as part of returns)
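
As a quick illustration of the sizing arithmetic referenced above (a sketch only; the capital, leverage, and position-count figures are introduced in the Methodology below):

# Sizing sketch using the Methodology figures: USD 20 million capital,
# 5x leverage, 50 positions opened on the first trading day of the year
capital = 20_000_000
leverage = 5
num_positions = 50
position_size = capital * leverage / num_positions
print(position_size)  # 2000000.0 -> USD 2 million per position at entry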

Relevant Literature¶

We have identified the following publications that provide academic insights into the proposed investment strategy:

  • Valeyre, Sebastien. "Optimal trend following portfolios." 2022.

Summary: Emphasizes the profitability of trend following strategies, despite the market efficiency hypothesis, and highlights their wide usage among professional asset managers due to their simplicity and effectiveness.

  • Fink, Josef. "A review of the Post-Earnings-Announcement Drift." Journal of Behavioral and Experimental Finance, 2020.

Summary: Provides a comprehensive overview of the PEAD phenomenon, summarizing research on how stock prices continue to drift in the direction of an earnings surprise for an extended period. It discusses the inefficiency of markets to fully adjust stock prices instantaneously after earnings announcements, contrary to the efficient market hypothesis.

  • Chan, Konan & Chan, Louis K. C. & Jegadeesh, Narasimhan & Lakonishok, Josef. "Earnings Quality and Stock Returns." The Journal of Business, 2006.

Summary: Discusses the relationship between the quality of a company's earnings, as indicated by its accruals, and its stock performance. It highlights that high accruals, suggesting low-quality earnings, are associated with poorer future stock returns. This suggests a market underreaction to the information conveyed by accrual levels. The analysis includes examining earnings manipulation, investor biases about future growth, and how these factors might influence stock returns.

  • Moskowitz, Tobias & Ooi, Yao Hua & Pedersen, Lasse H. "Time Series Momentum." The Initiative on Global Markets, 2011.

From the abstract:

 "We document significant “time series momentum” in equity index, currency, commodity, and bond futures for each of the 58 liquid instruments we consider. We find persistence in returns for 1 to 12 months that partially reverses over longer horizons, consistent with sentiment theories of initial under-reaction and delayed over-reaction. A diversified portfolio of time series momentum strategies across all asset classes delivers substantial abnormal returns with little exposure to standard asset pricing factors and performs best during extreme markets. Examining the trading activities of speculators and hedgers, we find that speculators profit from time series momentum at the expense of hedgers."

Methodology¶

The methodology is broken down into the following parts:

  • Section 1: Python Imports
  • Section 2: Python Functions
  • Section 3: Acquire Data
  • Section 4: Initial Data Investigation
  • Section 5: Develop Data
  • Section 5a: Earnings Per Share Signals
  • Section 5b: Identify Trades
  • Section 5c: Entry Price & Date
  • Section 5d: Implement Stop Loss
  • Section 5e: Exit Price & Date
  • Section 5f: Position Sizing
  • Section 5g: Profit & Loss
  • Section 5h: Trading Costs & Portfolio Value
  • Section 5j: Funding Costs
  • Section 5k: Returns

Section 1: Imports¶

The following libraries are required for our functions:

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from matplotlib import dates as mdates
import matplotlib.ticker as ticker
from matplotlib.ticker import FuncFormatter
import qtsprojectfunctions

Section 2: Python Functions¶

All functions are imported through the qtsprojectfunctions module above.
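
The module itself is not included in this notebook. Below is a minimal sketch of two of its helpers, dp and df_info, with behavior inferred from the printed output in later cells; the real implementations may differ:

import pandas as pd

# Hypothetical reconstructions of two qtsprojectfunctions helpers,
# inferred from the printed output below; not the actual module code
def dp(decimals):
    """Set the pandas float display precision."""
    pd.set_option('display.float_format', ('{:.' + str(decimals) + 'f}').format)

def df_info(df):
    """Print row/column counts and dtypes, then return the head for display."""
    print('There are ', df.shape[0], ' rows and ', df.shape[1], ' columns')
    print('The columns and data types are:')
    print(df.dtypes)
    return df.head()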

Section 3: Acquire Data¶

We will start off by pulling in the QUOTEMEDIA/PRICES, ZACKS/FC, ZACKS/SHRS, and ZACKS/MKTV datasets. These provide the required data for ticker, price, earnings per share, filing date, shares outstanding, and market valuation.
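
A fetch helper along these lines could be written with the nasdaq-data-link (formerly Quandl) package. The sketch below is an assumption about how such a helper might look; the actual functions are not shown, and evidently read from cached bulk exports (hence the zip file names in the comments and the "Skipping any possible download" messages below):

import nasdaqdatalink  # pip install nasdaq-data-link; requires an API key

def fetch_zacks_fc_sketch():
    # Illustrative only: pull the ZACKS/FC table and index it by period end date.
    # The real fetch_zacks_fc reads from a cached bulk export (e.g. FC_20240129.zip).
    nasdaqdatalink.ApiConfig.api_key = 'YOUR_API_KEY'  # placeholder
    fc = nasdaqdatalink.get_table('ZACKS/FC', paginate=True)
    return fc.set_index('per_end_date')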

In [2]:
from qtsprojectfunctions import fetch_qm_prices, fetch_zacks_fc, fetch_zacks_shrs, fetch_zacks_mktv
qm_prices = fetch_qm_prices()
# PRICES_20240304.zip
zacks_fc = fetch_zacks_fc()
# FC_20240129.zip
zacks_shrs = fetch_zacks_shrs()
# SHRS_20240304.zip
zacks_mktv = fetch_zacks_mktv()
# MKTV_20240304.zip
Skipping any possible download of QUOTEMEDIA/PRICES
Skipping any possible download of ZACKS/FC
Skipping any possible download of ZACKS/SHRS
Skipping any possible download of ZACKS/MKTV

Next we will merge the three ZACKS datasets together to form our fundamental dataset:

In [3]:
fundamental_data = pd.DataFrame()
fundamental_data = pd.merge(zacks_fc, zacks_shrs, left_on=['ticker', zacks_fc.index], right_on=['ticker', zacks_shrs.index], how='outer').rename(columns={'key_1':'per_end_date'}).set_index('per_end_date')
fundamental_data = fundamental_data.merge(zacks_mktv, left_on=['ticker', fundamental_data.index], right_on=['ticker', zacks_mktv.index], how='outer')
fundamental_data = fundamental_data[['ticker', 'eps_diluted_net', 'shares_out', 'mkt_val', 'filing_date']]
fundamental_data['filing_date'] = pd.to_datetime(fundamental_data['filing_date'])
fundamental_data = fundamental_data[(fundamental_data['filing_date'] > '2008') & (fundamental_data['filing_date'] < '2024')]

Next, we will filter the price data down to the date range to be analyzed (January 1, 2008 through December 31, 2023) and drop unused columns:

In [4]:
prices = qm_prices[(qm_prices.index >= '2008-01-01') & (qm_prices.index <= '2023-12-31')]
prices = prices[['ticker', 'adj_open', 'adj_high', 'adj_low', 'adj_close']].reset_index()
prices['date'] = pd.to_datetime(prices['date'])

And merge the prices and fundamental dataframes together:

In [5]:
merged_data = pd.merge(prices.sort_values('date'), 
                       fundamental_data.sort_values('filing_date'),
                       left_on=['ticker', 'date'],
                       right_on=['ticker', 'filing_date'],
                       how='left').set_index('date')
# start date 01/01/2010
merged_data = merged_data[merged_data.index >= '2010']
qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(merged_data)
There are  31204695  rows and  9  columns
The columns and data types are:
ticker                     object
adj_open                  float64
adj_high                  float64
adj_low                   float64
adj_close                 float64
eps_diluted_net           float64
shares_out                float64
mkt_val                   float64
filing_date        datetime64[ns]
dtype: object
Out[5]:
ticker adj_open adj_high adj_low adj_close eps_diluted_net shares_out mkt_val filing_date
date
2010-01-01 ROICU 10.40 10.40 10.40 10.40 NaN NaN NaN NaT
2010-01-01 ALBO 520.80 520.80 520.80 520.80 NaN NaN NaN NaT
2010-01-01 ERS 1.07 1.07 1.07 1.07 NaN NaN NaN NaT
2010-01-04 EEB 34.88 35.23 34.71 35.23 NaN NaN NaN NaT
2010-01-04 IP 15.93 16.08 15.84 15.93 NaN NaN NaN NaT

This dataframe provides the basic building blocks for the strategy. We have each equity defined by ticker, the open/high/low/close adjusted prices, earnings per share, shares outstanding, market capitalization defined as mkt_val, and the filing date of the report.

Section 4: Initial Data Investigation¶

We will now perform some initial data investigation to see what kind of relationships exist between EPS and price. Starting with NVDA:

In [6]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'NVDA')
[Figure: EPS vs. adjusted close price for NVDA]

In the first plot, we can visually see that there is a correlation between EPS and price.

Let's now check AAPL:

In [7]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'AAPL')
[Figure: EPS vs. adjusted close price for AAPL]

Again, there appears to be a correlation between an increase in price and an increase in EPS. Now, GOOGL:

In [8]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'GOOGL')
[Figure: EPS vs. adjusted close price for GOOGL]

GOOGL also appears to have a correlation between EPS and price. So far we have only looked at large cap tech stocks, so let's check something else, such as PFE:

In [9]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'PFE')
[Figure: EPS vs. adjusted close price for PFE]

Again, there is a relationship between EPS and price, but it does not appear to be as strong as for NVDA, AAPL, or GOOGL. Let's look at INTC:

In [10]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'INTC')
[Figure: EPS vs. adjusted close price for INTC]

One more example, WM:

In [11]:
qtsprojectfunctions.plot_eps_price(fundamental_data, prices, 'WM')
[Figure: EPS vs. adjusted close price for WM]

Based on the above examples, we can say with reasonable confidence that there is a relationship between EPS and price, consistent with our initial hypothesis that growth in earnings drives price appreciation. From this initial data we will proceed with identifying trading signals, capital allocation constraints, and a risk management process. We know that the market takes time to process changes in fundamental data, and price appreciation may not occur for some months following a positive earnings release. For this reason we will delay our buy signals to avoid short term volatility, and also diversify our holdings across many equities to avoid concentration risk.
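
To put a rough number on the visual relationship, one could also compute the correlation between EPS at each filing date and the adjusted close on that date. The helper below is a supplementary sketch, not part of the original analysis:

def eps_price_corr(fundamental_data, prices, ticker):
    # Pearson correlation between filing-date EPS and the adjusted close on
    # the filing date, for a single ticker (supplementary check only)
    f = fundamental_data[fundamental_data['ticker'] == ticker]
    p = prices[prices['ticker'] == ticker].set_index('date')['adj_close']
    merged = f.set_index('filing_date').join(p, how='inner')
    return merged['eps_diluted_net'].corr(merged['adj_close'])

for t in ['NVDA', 'AAPL', 'GOOGL', 'PFE', 'INTC', 'WM']:
    print(t, round(eps_price_corr(fundamental_data, prices, t), 2))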

Section 5: Develop Data¶

Section 5a: Earnings Per Share Signals¶

Next, we will develop the trading signals that will govern the strategy.

We will start off by completing the following with the data:

  • Remove any rows from the dataframe that do not have a filing date
  • Keep only rows with positive earnings per share
  • Keep only companies with a market cap greater than $ 10 billion
In [12]:
# Keep only rows with a filing date (copy to avoid modifying merged_data)
signals_df = merged_data[merged_data['filing_date'].notna()].copy()

# Fill missing EPS values with 0
signals_df['eps_diluted_net'] = signals_df['eps_diluted_net'].fillna(0)

# Keep only positive EPS
signals_df = signals_df[signals_df['eps_diluted_net'] > 0]

# Calc market cap (shares_out is in millions, so mkt_val is in USD millions)
signals_df['mkt_val'] = signals_df['adj_close'] * signals_df['shares_out']

# Keep only market caps greater than USD 10 billion (10000 in USD millions)
signals_df = signals_df[signals_df['mkt_val'] >= 10000]

Let's check to see how many unique tickers this leaves us:

In [13]:
len(signals_df['ticker'].unique())
Out[13]:
863

From the above, we can see that there are 863 unique tickers that satisfy the criteria.

Next, we will perform the following:

  • Group the data by 'ticker'
  • Shift the EPS values
  • Calculate the annual percent change in earnings per share from filing date to filing date
  • Shift the adjusted close prices
  • Calculate the annual percent change in adjusted close price from filing date to filing date
In [14]:
# Find % change in earnings 
sorted_df = signals_df.sort_values(by = ['ticker', 'date'])

# Shift EPS data
sorted_df['previous_eps_diluted_net'] = sorted_df.groupby('ticker')['eps_diluted_net'].shift(1)

# Calc the change in EPS
sorted_df['pct_change_eps_diluted_net'] = (sorted_df['eps_diluted_net'] - sorted_df['previous_eps_diluted_net']) / sorted_df['previous_eps_diluted_net']

# Shift adjusted close prices
sorted_df['previous_adj_close'] = sorted_df.groupby('ticker')['adj_close'].shift(1)

# Calculate change in price
sorted_df['pct_change_adj_close'] = (sorted_df['adj_close'] - sorted_df['previous_adj_close']) / sorted_df['previous_adj_close']

# Drop any na values
sorted_df.dropna(subset=['previous_eps_diluted_net'], inplace=True)

Next, we will merge the sorted dataframe with the signals dataframe:

In [15]:
signals_df = signals_df.merge(sorted_df[['ticker', 'previous_eps_diluted_net', 'pct_change_eps_diluted_net']],
                              left_on=['ticker', signals_df.index], right_on=['ticker', sorted_df.index], 
                              how='left').rename(columns={'key_1':'date'}).set_index('date')

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(signals_df)
There are  6225  rows and  11  columns
The columns and data types are:
ticker                                object
adj_open                             float64
adj_high                             float64
adj_low                              float64
adj_close                            float64
eps_diluted_net                      float64
shares_out                           float64
mkt_val                              float64
filing_date                   datetime64[ns]
previous_eps_diluted_net             float64
pct_change_eps_diluted_net           float64
dtype: object
Out[15]:
ticker adj_open adj_high adj_low adj_close eps_diluted_net shares_out mkt_val filing_date previous_eps_diluted_net pct_change_eps_diluted_net
date
2010-01-22 ADBE 35.62 35.82 34.35 34.38 0.73 523.76 18006.87 2010-01-22 NaN NaN
2010-01-25 AAPL 6.12 6.19 6.05 6.14 0.32 25082.88 153997.96 2010-01-25 NaN NaN
2010-01-26 NVS 29.32 29.47 29.19 29.41 3.69 2271.20 66798.91 2010-01-26 NaN NaN
2010-01-29 ISRG 37.27 37.44 36.32 36.45 0.66 343.73 12529.34 2010-01-29 NaN NaN
2010-01-29 AMZN 6.47 6.58 6.19 6.26 0.10 8659.66 54169.93 2010-01-29 NaN NaN

The above dataframe contains the key data for EPS that we will use to develop the trading strategy.

Section 5b: Identify Trades¶

Next, we will identify the 50 trades that we want to make on an annual basis. These 50 trades consist of the 50 largest changes in year over year earnings per share by percentage. We will do this for every year from 2011 through 2023, for 13 years. These are the actions to take with our data:

  • Keep only rows with a filing date after 2010 (so the data begins in 2011)
  • Set variable for number of annual trades
  • Group data by filing year
  • Find the 50 largest year over year changes by percentage in EPS
In [16]:
# Copy dataframe
trades_to_make = signals_df.copy().dropna()

# using filing date here to make sure the company did actually file in the previous year and that we actually have the data
trades_to_make['filing_year'] = pd.to_datetime(trades_to_make['filing_date']).dt.year

# Keep only filing dates after 2010
trades_to_make = trades_to_make[trades_to_make['filing_year'] > 2010]

# Set number of trades to handle on an annual basis
num_largest = 50

# Group by filing year, and then keep the 50 largest percent changes
top_50_trades_per_year = trades_to_make.groupby('filing_year').apply(lambda x: x.nlargest(num_largest, 'pct_change_eps_diluted_net')).reset_index(drop=True)

# Keep only needed columns
top_50_trades_per_year = top_50_trades_per_year[['ticker', 'adj_close', 'eps_diluted_net', 'previous_eps_diluted_net', 
                                                 'pct_change_eps_diluted_net', 'filing_date', 'filing_year']]

# Rename adjusted close to avoid confusion later
top_50_trades_per_year.rename(columns = {'adj_close':'adj_close_filing_date'}, inplace = True)

Next, we will merge the trades dataframe with the prices dataframe, which will provide us a dataframe that includes daily price data for the entire year for every trade, with the following actions:

  • Create a column for trade year
  • Merge the prices dataframe with the trades dataframe
  • Rename the adjusted prices so that we can identify them as the prices we are trading on
In [17]:
# Adding 1 to year since we will be placing trades on first trading day of the next year, so
# if a company reported outstanding earnings growth in 2011 we will buy on the first trading day of 2012
top_50_trades_per_year['trade_year'] = top_50_trades_per_year['filing_year'] + 1

# Establish trade year
prices['trade_year'] = pd.to_datetime(prices['date']).dt.year

# Combine trades dataframe with prices dataframe
filtered_prices = pd.merge(prices, top_50_trades_per_year, on=['ticker', 'trade_year'], how='inner')

# Sort by date and then ticker
filtered_prices = filtered_prices.sort_values(by=['date', 'ticker'])

# Rename the adjusted price columns so that we know these are the prices we are trading on
filtered_prices.rename(columns = {'adj_open':'adj_open_trade', 
                                  'adj_high':'adj_high_trade', 
                                  'adj_low':'adj_low_trade', 
                                  'adj_close':'adj_close_trade'}, inplace = True)

filtered_prices.drop(columns = {'adj_close_filing_date', 'eps_diluted_net', 'previous_eps_diluted_net', 
                                'pct_change_eps_diluted_net', 'filing_date', 'filing_year'}, inplace = True)

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(filtered_prices)
There are  150900  rows and  7  columns
The columns and data types are:
date               datetime64[ns]
ticker                     object
adj_open_trade            float64
adj_high_trade            float64
adj_low_trade             float64
adj_close_trade           float64
trade_year                  int64
dtype: object
Out[17]:
date ticker adj_open_trade adj_high_trade adj_low_trade adj_close_trade trade_year
10750 2012-01-03 AAPL 12.38 12.47 12.37 12.43 2012
5000 2012-01-03 ADBE 28.70 29.01 28.51 28.57 2012
8000 2012-01-03 AFL 16.46 16.74 16.44 16.61 2012
6250 2012-01-03 AMAT 8.98 9.01 8.77 8.79 2012
2750 2012-01-03 AXP 40.40 40.95 40.27 40.48 2012

The above dataframe gives us the price data for each equity for the entire year. Later we will drop any price data that is no longer needed after the position is closed.

Section 5c: Entry Price & Date¶

Using the combined price/trade opportunity data, we'll now establish the entry price and date for each trade:

  • Add column for entry price
  • Add column for entry date

In our strategy, the entry date of every position is the first trading day of the year. It is necessary to implement it this way because we are identifying trading opportunities through the change in year over year EPS. Companies report earnings at different times throughout the year and the sorting by annual change in EPS cannot take place until the dataset for year over year change in EPS is complete. This approach works because we are seeking to identify the outlier opportunities for longer term price appreciation as opposed to short term reaction and market volatility.

In [18]:
# Create column for entry price
filtered_prices['entry_price'] = filtered_prices.groupby(['ticker', 'trade_year'])['adj_close_trade'].transform('first')

# Create column for entry date
filtered_prices['entry_date'] = filtered_prices.groupby(['ticker', 'trade_year'])['date'].transform('first')

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(filtered_prices)
There are  150900  rows and  9  columns
The columns and data types are:
date               datetime64[ns]
ticker                     object
adj_open_trade            float64
adj_high_trade            float64
adj_low_trade             float64
adj_close_trade           float64
trade_year                  int64
entry_price               float64
entry_date         datetime64[ns]
dtype: object
Out[18]:
date ticker adj_open_trade adj_high_trade adj_low_trade adj_close_trade trade_year entry_price entry_date
10750 2012-01-03 AAPL 12.38 12.47 12.37 12.43 2012 12.43 2012-01-03
5000 2012-01-03 ADBE 28.70 29.01 28.51 28.57 2012 28.57 2012-01-03
8000 2012-01-03 AFL 16.46 16.74 16.44 16.61 2012 16.61 2012-01-03
6250 2012-01-03 AMAT 8.98 9.01 8.77 8.79 2012 8.79 2012-01-03
2750 2012-01-03 AXP 40.40 40.95 40.27 40.48 2012 40.48 2012-01-03

Section 5d: Implement Stop Loss¶

Next, we'll implement the stop loss criteria.

The stop loss consists of a 10% trailing stop from the current price, adjusted daily at the close price. We will perform the following actions on the data:

  • Add empty column for stop loss price
  • Calculate the stop loss price, adjusted on a daily basis
  • Apply the stop loss price function to the data

When developing a stop loss, there is a balance between tolerating a short term unrealized loss (with the potential benefit of price recovery) and exiting the position (foregoing any possibility of recovery). We selected a 10% trailing stop because it allows positions to grow organically while the stop moves up simultaneously as the price increases.
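
The ratchet mechanics are easy to see on a toy price path; the stop only ever moves up. This illustration is not part of the backtest (note that in the implementation below, the stop on the first day of a position is left at zero, so a position cannot be stopped out on its entry day):

# Toy illustration of a 10% trailing stop ratchet
highs = [100, 105, 103, 110, 108]
stop = 0.0
for high in highs:
    stop = max(high * (1 - 0.10), stop)  # ratchet up, never down
    print(f'high={high} stop={stop:.2f}')
# The stop rises to 99.00 after the 110 high and holds there on the pullback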

In [19]:
# Create empty (float) column for stop loss price
filtered_prices['stop_loss_price'] = 0.0

# Set trailing stop percentage variable
trailing_stop = 0.10

def calc_stop_loss(group):
    # Ratchet the stop up to adj_high_trade * (1 - trailing_stop); it never moves down.
    # The first row of each group has no prior stop, so the KeyError leaves it at 0.
    for index, row in group.iterrows():
        try:
            previous_stop_loss = group.at[index - 1, 'stop_loss_price']
            group.at[index, 'stop_loss_price'] = max(row['adj_high_trade'] * (1 - trailing_stop), previous_stop_loss)
        except KeyError:
            pass
    return group

# Apply stop loss function to the price data for each ticker for the specific trade year
filtered_prices = filtered_prices.groupby(['ticker', 'trade_year']).apply(calc_stop_loss).reset_index(drop=True)

Next, we will calculate when the positions are stopped out via the trailing stop. This consists of the following actions:

  • Exit positions at the stop loss when the daily adjusted low price is lower than our stop loss price
  • If the position does not hit a stop loss at any point throughout the year, exit the position at the end of the year
  • Clean the data to keep only price data from the entry date through the exit date
In [20]:
# Implement stop loss
filtered_prices['Stop_Loss'] = np.where(filtered_prices['adj_low_trade'] <= filtered_prices['stop_loss_price'], 'Stop Loss Or Exit Position', None)

# If position never hits actual stop loss, then implement a sell signal at the end of the year
def exit_position(group):
    group.iloc[-1, group.columns.get_loc('Stop_Loss')] = 'Stop Loss Or Exit Position'
    return group

# Implement end of year sell signal to exit the position
filtered_prices = filtered_prices.groupby(['ticker', 'trade_year']).apply(exit_position).reset_index(drop=True)

# Fill down stop loss status
filtered_prices['Stop_Loss'] = filtered_prices.groupby(['ticker', 'trade_year'])['Stop_Loss'].ffill()

# Calc duplicated values, mark duplicates as True and keep the first value marked as False
filtered_prices['duplicated'] = filtered_prices.groupby(['ticker', 'trade_year'])['Stop_Loss'].transform(lambda x: x.duplicated(keep='first'))

# Remove any entries where the stop loss indication is duplicated,
# thereby filtering the dates to include only price data between the entry date and exit date
filtered_prices = filtered_prices[~((filtered_prices['Stop_Loss'] == 'Stop Loss Or Exit Position') & (filtered_prices['duplicated'] == True))]

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(filtered_prices)
There are  34631  rows and  12  columns
The columns and data types are:
date               datetime64[ns]
ticker                     object
adj_open_trade            float64
adj_high_trade            float64
adj_low_trade             float64
adj_close_trade           float64
trade_year                  int64
entry_price               float64
entry_date         datetime64[ns]
stop_loss_price           float64
Stop_Loss                  object
duplicated                   bool
dtype: object
Out[20]:
date ticker adj_open_trade adj_high_trade adj_low_trade adj_close_trade trade_year entry_price entry_date stop_loss_price Stop_Loss duplicated
0 2012-01-03 AAPL 12.38 12.47 12.37 12.43 2012 12.43 2012-01-03 0.00 None False
1 2012-01-03 ADBE 28.70 29.01 28.51 28.57 2012 28.57 2012-01-03 0.00 None False
2 2012-01-03 AFL 16.46 16.74 16.44 16.61 2012 16.61 2012-01-03 0.00 None False
3 2012-01-03 AMAT 8.98 9.01 8.77 8.79 2012 8.79 2012-01-03 0.00 None False
4 2012-01-03 AXP 40.40 40.95 40.27 40.48 2012 40.48 2012-01-03 0.00 None False

Section 5e: Exit Price & Date¶

Next, we will perform the following actions to complete the trading strategy:

  • Add column for exit price
  • Add column for exit date

Based on the exit criteria, we are expecting positions to drop off throughout the year as they hit the stop loss.

In [21]:
# Add column for exit price
filtered_prices['exit_price'] = np.where(filtered_prices['Stop_Loss'] == 'Stop Loss Or Exit Position', filtered_prices['stop_loss_price'], None)
filtered_prices['exit_price'] = filtered_prices['exit_price'].astype(float)

# Set the exit date where the stop loss is hit / when the position exits at the end of the year
filtered_prices['exit_date'] = np.where(filtered_prices['Stop_Loss'] == 'Stop Loss Or Exit Position', filtered_prices['date'], None)
filtered_prices['exit_date'] = pd.to_datetime(filtered_prices['exit_date'])

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(filtered_prices)
There are  34631  rows and  14  columns
The columns and data types are:
date               datetime64[ns]
ticker                     object
adj_open_trade            float64
adj_high_trade            float64
adj_low_trade             float64
adj_close_trade           float64
trade_year                  int64
entry_price               float64
entry_date         datetime64[ns]
stop_loss_price           float64
Stop_Loss                  object
duplicated                   bool
exit_price                float64
exit_date          datetime64[ns]
dtype: object
Out[21]:
date ticker adj_open_trade adj_high_trade adj_low_trade adj_close_trade trade_year entry_price entry_date stop_loss_price Stop_Loss duplicated exit_price exit_date
0 2012-01-03 AAPL 12.38 12.47 12.37 12.43 2012 12.43 2012-01-03 0.00 None False NaN NaT
1 2012-01-03 ADBE 28.70 29.01 28.51 28.57 2012 28.57 2012-01-03 0.00 None False NaN NaT
2 2012-01-03 AFL 16.46 16.74 16.44 16.61 2012 16.61 2012-01-03 0.00 None False NaN NaT
3 2012-01-03 AMAT 8.98 9.01 8.77 8.79 2012 8.79 2012-01-03 0.00 None False NaN NaT
4 2012-01-03 AXP 40.40 40.95 40.27 40.48 2012 40.48 2012-01-03 0.00 None False NaN NaT

Section 5f: Position Sizing¶

Next, we will establish the position sizes through the following actions on the data:

  • Calculate number of shares
  • Calculate daily value of shares using end of day adjusted close prices
  • Calculate starting value of shares at position entry
  • Calculate ending value of shares at position exit

We are working with USD 20 million in capital and will implement 5x leverage for a total notional of USD 100 million. With 50 positions established on the first trading day of the year, that gives a starting position size of USD 2 million.

In [22]:
# Equal weight sizing: USD 2 million per position at entry
position_capital = 2000000
filtered_prices['Shares'] = position_capital / filtered_prices.groupby(['ticker', 'trade_year'])['adj_close_trade'].transform('first')
filtered_prices['Shares'] = filtered_prices['Shares'].round()

# Daily value of the position; on the exit day, value the shares at the exit price
filtered_prices['Share_Value'] = np.where(filtered_prices['Stop_Loss'] == 'Stop Loss Or Exit Position', filtered_prices['exit_price'] * filtered_prices['Shares'], filtered_prices['Shares'] * filtered_prices['adj_close_trade'])

# Value of the position at entry
filtered_prices['Starting_Value'] = filtered_prices['entry_price'] * filtered_prices['Shares']
filtered_prices['Starting_Value'] = filtered_prices['Starting_Value'].astype(float)

# Value of the position at exit (0 while the position remains open)
filtered_prices['Ending_Value'] = np.where(filtered_prices['Stop_Loss'] == 'Stop Loss Or Exit Position', filtered_prices['exit_price'] * filtered_prices['Shares'], None)
filtered_prices['Ending_Value'] = filtered_prices['Ending_Value'].astype(float)
filtered_prices['Ending_Value'] = filtered_prices['Ending_Value'].fillna(0)

Section 5g: Profit & Loss¶

Next, we calculate the following:

  • Daily profit and loss for each position
  • Total profit and loss for each trade
  • Return relative to the entry price for each trade
In [23]:
# Add column for daily PnL
filtered_prices['Daily_PnL'] = filtered_prices.groupby(['ticker', 'trade_year'])['Share_Value'].diff()

# Add column for total trade PnL
filtered_prices['Trade_PnL'] = filtered_prices.groupby(['ticker', 'trade_year'])['Daily_PnL'].cumsum()

# Return relative to the entry price (cumulative since entry, not a one-day return)
filtered_prices['Daily_Return'] = (filtered_prices['adj_close_trade'] / filtered_prices['entry_price'])-1

Section 5h: Trading Costs & Portfolio Value¶

Next, we will calculate high level portfolio statistics by the following actions:

  • Calculate the total value of all equity positions on a daily basis
  • Calculate the total value of the cash position on a daily basis
  • Calculate the total portfolio value on a daily basis

When we refer to the cash position in the portfolio, it's important to remember that this value is used for tracking closed positions only. In reality, we are paying down the funding source with any cash generated from exiting positions until the funding source has been paid back.

In [24]:
# Daily value of open positions (0 on the exit day, where Ending_Value equals Share_Value)
filtered_prices['Daily_Share_Value'] = filtered_prices['Share_Value'] - filtered_prices['Ending_Value']

# Create new dataframe with daily share value
Daily_Share_Value = filtered_prices.groupby(['date'])['Daily_Share_Value'].sum()
Daily_Share_Value = Daily_Share_Value.to_frame()

# Create new dataframe for daily cash flow (happens only when we are exiting positions)
Daily_Cash_Flow = filtered_prices[filtered_prices['Ending_Value'] != 0].groupby(['date'])['Ending_Value'].sum()
Daily_Cash_Flow = Daily_Cash_Flow.to_frame()

# Merge
returns = pd.merge(Daily_Share_Value, Daily_Cash_Flow, how = 'left', on = 'date')

# Rename columns
returns.rename(columns = {'Ending_Value':'Daily_Cash_Flow','Daily_Share_Value':'Total_Position_Value'}, inplace = True)

# Fill missing cash flow values
returns['Daily_Cash_Flow'] = returns['Daily_Cash_Flow'].fillna(0)

# On the first trading day of each year the total position value jumps by roughly
# the full USD 100 million notional as new positions are opened; book that jump as
# a cash outflow (cash used to fund the new positions) so the portfolio value is
# not double counted across the annual reset
returns['temp'] = returns['Total_Position_Value'].diff()
returns['Daily_Cash_Flow'] = np.where(returns['temp'] > 99000000, returns['Daily_Cash_Flow'] - returns['temp'], returns['Daily_Cash_Flow'])
returns.drop(columns = {'temp'}, inplace = True)

# Calculate portfolio cash position
returns['Portfolio_Cash'] = returns['Daily_Cash_Flow'].cumsum()
returns['Portfolio_Cash'] = returns['Portfolio_Cash'].ffill()

# Calculate trading costs - assume 10 basis points or 0.10% for trading costs
returns['Trading_Costs'] = returns['Daily_Cash_Flow'] * 0.001

# Total portfolio value
returns['Total_Portfolio_Value'] = returns['Total_Position_Value'] + returns['Portfolio_Cash'] - returns['Trading_Costs']

Section 5j: Funding Costs¶

Next, we will calculate the funding costs. As mentioned above, in this strategy, we are using USD 20 million in capital with 5x leverage for a total notional (as of the 1st trading day of the year) of USD 100 million. Here's what we will do:

  • Use the Federal Reserve federal funds rate
  • Calculate daily funding amount
  • Calculate daily funding costs
  • Calculate daily capital and return on capital

The funding costs are affected by the funding rate and the amount funded. We expect that the funding costs will go down as the year progresses and positions are exited through the trailing stop.

In [25]:
from qtsprojectfunctions import fetch_fed_funds
fed_funds = fetch_fed_funds()
In [26]:
returns_leverage = pd.merge(returns, fed_funds, how = 'outer', on = 'date')
returns_leverage.sort_values(by = ['date'], inplace = True)

# Forward fill the fed funds rate over non-publication days, then convert to a daily rate
returns_leverage['Fed_Funds_Annual'] = returns_leverage['Fed_Funds_Annual'].ffill() / 100
returns_leverage['Fed_Funds_Daily'] = returns_leverage['Fed_Funds_Annual'] / 252
In [27]:
# Leverage, assuming Capital of 20m and 5x leverage
# Calculate the amount to fund on a daily basis
capital = 20000000
returns_leverage['Daily_Fund'] = np.where(returns_leverage['Total_Position_Value'] > capital, returns_leverage['Total_Position_Value'] - capital, 0)
returns_leverage.dropna(subset = ['Total_Position_Value'], inplace = True)

# Calculate daily borrowing costs
returns_leverage['Daily_Funding_Cost'] = returns_leverage['Daily_Fund'] * returns_leverage['Fed_Funds_Daily']
returns_leverage['Cum_Funding_Cost'] = returns_leverage['Daily_Funding_Cost'].cumsum()

qtsprojectfunctions.dp(2)
qtsprojectfunctions.df_info(returns_leverage)
There are  2177  rows and  10  columns
The columns and data types are:
Total_Position_Value     float64
Daily_Cash_Flow          float64
Portfolio_Cash           float64
Trading_Costs            float64
Total_Portfolio_Value    float64
Fed_Funds_Annual         float64
Fed_Funds_Daily          float64
Daily_Fund               float64
Daily_Funding_Cost       float64
Cum_Funding_Cost         float64
dtype: object
Out[27]:
Total_Position_Value Daily_Cash_Flow Portfolio_Cash Trading_Costs Total_Portfolio_Value Fed_Funds_Annual Fed_Funds_Daily Daily_Fund Daily_Funding_Cost Cum_Funding_Cost
date
2012-01-03 100000046.47 0.00 0.00 0.00 100000046.47 0.00 0.00 80000046.47 253.97 253.97
2012-01-04 99838597.97 0.00 0.00 0.00 99838597.97 0.00 0.00 79838597.97 253.46 507.42
2012-01-05 99991894.01 0.00 0.00 0.00 99991894.01 0.00 0.00 79991894.01 253.94 761.37
2012-01-06 99420348.41 0.00 0.00 0.00 99420348.41 0.00 0.00 79420348.41 252.13 1013.49
2012-01-09 99985691.93 0.00 0.00 0.00 99985691.93 0.00 0.00 79985691.93 253.92 1267.42

Section 5k: Returns¶

Finally, we will calculate the returns on both the portfolio as a whole and the return on capital. These are the steps we will take:

  • Calculate daily returns on the entire portfolio value (position values + portfolio cash)
  • Calculate total capital
  • Calculate return on capital

Throughout the strategy any capital on hand greater than USD 20 million is moved off book but still analyzed as part of the return on capital. This allows us to maintain a consistent level of leverage, which as mentioned above is reset annually on the first trading day of the year.

In [28]:
# Daily portfolio returns
returns_leverage['Portfolio_Daily_Ret'] = returns_leverage['Total_Portfolio_Value'].pct_change()

# Total capital and daily return on capital
returns_leverage['Total_Portfolio_Value_Diff'] = returns_leverage['Total_Portfolio_Value'].diff()
returns_leverage['Total_Cap'] = returns_leverage['Total_Portfolio_Value_Diff'].cumsum() + capital - returns_leverage['Daily_Funding_Cost']
returns_leverage['Daily_Ret_On_Cap'] = returns_leverage['Total_Cap'].pct_change()

qtsprojectfunctions.dp(2)
# returns_leverage[(returns_leverage.index >= '2012-12-15') & (returns_leverage.index <= '2013-01-15')]
qtsprojectfunctions.df_info(returns_leverage)
There are  2177  rows and  14  columns
The columns and data types are:
Total_Position_Value          float64
Daily_Cash_Flow               float64
Portfolio_Cash                float64
Trading_Costs                 float64
Total_Portfolio_Value         float64
Fed_Funds_Annual              float64
Fed_Funds_Daily               float64
Daily_Fund                    float64
Daily_Funding_Cost            float64
Cum_Funding_Cost              float64
Portfolio_Daily_Ret           float64
Total_Portfolio_Value_Diff    float64
Total_Cap                     float64
Daily_Ret_On_Cap              float64
dtype: object
Out[28]:
Total_Position_Value Daily_Cash_Flow Portfolio_Cash Trading_Costs Total_Portfolio_Value Fed_Funds_Annual Fed_Funds_Daily Daily_Fund Daily_Funding_Cost Cum_Funding_Cost Portfolio_Daily_Ret Total_Portfolio_Value_Diff Total_Cap Daily_Ret_On_Cap
date
2012-01-03 100000046.47 0.00 0.00 0.00 100000046.47 0.00 0.00 80000046.47 253.97 253.97 NaN NaN NaN NaN
2012-01-04 99838597.97 0.00 0.00 0.00 99838597.97 0.00 0.00 79838597.97 253.46 507.42 -0.00 -161448.49 19838298.05 NaN
2012-01-05 99991894.01 0.00 0.00 0.00 99991894.01 0.00 0.00 79991894.01 253.94 761.37 0.00 153296.04 19991593.60 0.01
2012-01-06 99420348.41 0.00 0.00 0.00 99420348.41 0.00 0.00 79420348.41 252.13 1013.49 -0.01 -571545.60 19420049.81 -0.03
2012-01-09 99985691.93 0.00 0.00 0.00 99985691.93 0.00 0.00 79985691.93 253.92 1267.42 0.01 565343.52 19985391.54 0.03

Results¶

The results analysis is broken down into the following parts:

  • Section 1: Portfolio Returns
  • Section 2: Return On Capital
  • Section 3: Returns Comparison

Section 1: Portfolio Returns¶

We'll now dive into the results of the high level trading strategy, starting with the statistics on the portfolio returns:

In [29]:
qtsprojectfunctions.dp(4)
Portfolio_Daily_Ret = qtsprojectfunctions.return_stats(returns_leverage[['Portfolio_Daily_Ret']])
Portfolio_Daily_Ret
Out[29]:
Mean (Annual) Volatility (Annual) Sharpe Ratio (Annual) Max Return (Daily) Max Return (Date) Min Return (Daily) Min Return (Date) Max Drawdown Peak Bottom Recovery Date
Portfolio_Daily_Ret 0.0210 0.0546 0.3850 0.0376 2019-01-04 -0.0266 2018-02-05 -0.1178 2013-12-26 2016-02-11 2018-01-17

We can see that the annualized mean return is 2.1%. This is not a great return, but the volatility is very low at 5.5%. The resulting Sharpe ratio is also modest because the return is low.

On the plus side, the maximum drawdown is small at 11.8%. However, this is to be expected given the 10% trailing stop loss that we have implemented.
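
As a consistency check on the table (assuming return_stats computes the Sharpe ratio as annualized mean over annualized volatility, with no risk-free adjustment):

# Consistency check on the reported statistics (assumed Sharpe = mean / vol)
mean_annual, vol_annual = 0.0210, 0.0546
print(round(mean_annual / vol_annual, 4))  # ~0.3846, in line with the 0.3850 shown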

Next, here's a histogram of the daily returns:

In [30]:
qtsprojectfunctions.ret_hist(returns_leverage[['Portfolio_Daily_Ret']])
[Figure: histogram of daily portfolio returns]

We can see that the mean return is clustered around 0 and the cutoff for 1 standard deviation is 0.34%.

In [31]:
qtsprojectfunctions.dp(6)
returns_leverage[['Portfolio_Daily_Ret']].describe()
Out[31]:
Portfolio_Daily_Ret
count 2176.000000
mean 0.000083
std 0.003439
min -0.026557
25% -0.000734
50% 0.000083
75% 0.000955
max 0.037566

Section 2: Return On Capital¶

Next, here's the results for the return on capital:

In [32]:
qtsprojectfunctions.dp(4)
Daily_Ret_On_Cap = qtsprojectfunctions.return_stats(returns_leverage[['Daily_Ret_On_Cap']])
Daily_Ret_On_Cap
Out[32]:
Mean (Annual) Volatility (Annual) Sharpe Ratio (Annual) Max Return (Daily) Max Return (Date) Min Return (Daily) Min Return (Date) Max Drawdown Peak Bottom Recovery Date
Daily_Ret_On_Cap 0.0983 0.2089 0.4705 0.1646 2019-01-04 -0.0980 2018-02-05 -0.4231 2013-12-26 2016-02-11 2018-01-17

These results look considerably better - at least from a mean return standpoint. The volatility is higher, but that's to be expected given we are analyzing only the return on capital. The same applies to the maximum daily return, minimum daily return, and maximum drawdown.

In [33]:
qtsprojectfunctions.ret_hist(returns_leverage[['Daily_Ret_On_Cap']])
[Figure: histogram of daily returns on capital]

Again, the mean return is clustered around 0 with a standard deviation of 1.3%.

In [34]:
qtsprojectfunctions.dp(6)
returns_leverage[['Daily_Ret_On_Cap']].describe()
Out[34]:
Daily_Ret_On_Cap
count 2175.000000
mean 0.000390
std 0.013162
min -0.098043
25% -0.002721
50% 0.000292
75% 0.003688
max 0.164627

Section 3: Returns Comparison¶

The following plot compares the total return of the portfolio to the total return on capital.

In [35]:
returns_leverage['Portfolio_Cum_Ret'] = (returns_leverage['Portfolio_Daily_Ret'] + 1).cumprod()
returns_leverage['Cum_Ret_On_Cap'] = (returns_leverage['Daily_Ret_On_Cap'] + 1).cumprod()

# Create the initial plot
plt.figure(figsize=(10, 5))

# Plot the first y-axis data
plt.plot(returns_leverage.index, returns_leverage['Portfolio_Cum_Ret'], label = 'Portfolio Cumulative Return', linestyle='-', color='b', linewidth=2)
plt.plot(returns_leverage.index, returns_leverage['Cum_Ret_On_Cap'], label = 'Cumulative Return On Capital', linestyle='-', color='g', linewidth=2)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Total Return')
plt.title('Cumulative Returns Comparison')
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.legend(fontsize = 8)
plt.show()
[Figure: cumulative returns comparison, portfolio return vs. return on capital]

Based on the plot, it can be seen that the leverage amplifies both the upside and downside. The total return on capital is essentially the same as the total portfolio return - only scaled by a factor of 5. The total portfolio return does factor in funding costs, but as we will see later on, the funding costs are relatively small due to the risk management that we are implementing.

Discussion¶

The discussion is broken down into the following parts:

  • Section 1: Portfolio Values
  • Section 2: Trade Analysis
  • Section 3: Benchmark Comparison
  • Section 3a: Returns Comparison
  • Section 3b: Cumulative Daily Profit & Loss
  • Section 3c: Total Trade Profit & Loss
  • Section 4: Drawdown Analysis
  • Section 5: Funding Costs
  • Section 6: Trading Costs

Section 1: Portfolio Values¶

The following plot contains the total values for positions, portfolio cash, and total portfolio value.

In [36]:
# Create the initial plot
plt.figure(figsize=(10, 5))

# Plot the first y-axis data
plt.scatter(returns_leverage.index, returns_leverage['Total_Position_Value'], label='Total Equity Position Value', marker='.', linestyle='-', color='b', linewidth=1)
plt.scatter(returns_leverage.index, returns_leverage['Portfolio_Cash'], label='Total Portfolio Cash', marker='.', linestyle='-', color='g', linewidth=1)
plt.scatter(returns_leverage.index, returns_leverage['Total_Portfolio_Value'], label='Total Portfolio Value', marker='.', linestyle='-', color='r', linewidth=1)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Total Value')
plt.title('Total Values For Equity Positions, Portfolio Cash, and Portfolio Value')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.legend(fontsize = 8)
plt.show()
[Figure: total values for equity positions, portfolio cash, and portfolio value, 2012-2023]

This is cumbersome to read and understand, so we will zoom in on 2017. Here's the plot for 2017:

In [37]:
# Create the initial plot
plt.figure(figsize=(10, 5))

start_date = '2017-01-01'
end_date = '2017-12-31'

only_2017 = returns_leverage[(returns_leverage.index >= start_date) & (returns_leverage.index <= end_date)]

# Plot the first y-axis data
plt.scatter(only_2017.index, only_2017['Total_Position_Value'], label='Total Equity Position Value', marker='.', linestyle='-', color='b', linewidth=1)
plt.scatter(only_2017.index, only_2017['Portfolio_Cash'], label='Total Portfolio Cash', marker='.', linestyle='-', color='g', linewidth=1)
plt.scatter(only_2017.index, only_2017['Total_Portfolio_Value'], label='Total Portfolio Value', marker='.', linestyle='-', color='r', linewidth=1)
plt.gca().xaxis.set_major_locator(mdates.MonthLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y-%m'))  # Change to '%Y-%m' for year and month
plt.xlabel('Year')
plt.ylabel('Total Value')
plt.title('Total Values For Equity Positions, Portfolio Cash, and Portfolio Value')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.legend(fontsize = 8)
plt.show()
[Figure: total values for equity positions, portfolio cash, and portfolio value, 2017 only]

From the above plot, we can clearly see what is happening to the total equity value over the course of the year.

Recall that we enter the positions on the first trading day of the year, set the stop loss, and let the risk management take over from there. From the above, we can see that the total equity position value (in blue) starts at approximately $ 100 million and slowly decreases as positions are exited through the stop loss. When positions are exited, the cash becomes portfolio cash (in green). As the year progresses, the decrease in total equity value is matched by a corresponding increase in total portfolio cash.

Any positions that are open at the end of the year are closed on the last trading day of the year.

Together, the total equity value and total portfolio cash make up the total portfolio value (in red). Any gains that are made throughout the year are harvested and the trading strategy starts with $ 100 million the next year.

Section 2: Trade Analysis¶

We'll now do some analysis on the trades that took place during the strategy.

In [38]:
trades = filtered_prices[['ticker', 'entry_date', 'entry_price', 'exit_date', 'exit_price', 'Trade_PnL', 'Stop_Loss']]
trades = trades[trades['Stop_Loss'] == 'Stop Loss Or Exit Position']
In [39]:
(trades['exit_price'] > trades['entry_price']).value_counts()
Out[39]:
False    335
True     264
dtype: int64

The first thing we can see is that of the 599 trades, 264 were profitable and 335 were not. We didn't have a strong expectation of what the proportion of profitable to non-profitable trades would be.
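
For reference, that works out to a win rate of about 44% (supplementary arithmetic from the counts above):

# Win rate from the trade counts above
wins, losses = 264, 335
print(f'Win rate: {wins / (wins + losses):.1%}')  # 44.1%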

In [40]:
trades['ticker'].unique()
Out[40]:
array(['PHG', 'NEM', 'COF', 'GLW', 'NOK', 'HES', 'JNPR', 'MT', 'SCCO',
       'FCX', 'IBN', 'AMAT', 'HAL', 'AFL', 'BHP', 'CAT', 'CVE', 'SHG',
       'GGB', 'BSBR', 'CEO', 'OXY', 'F', 'CVX', 'SHEL', 'AAPL', 'BIDU',
       'BLK', 'COP', 'TM', 'TXN', 'JPM', 'CAJPY', 'TEVA', 'KR', 'ISRG',
       'BA', 'HSBC', 'INTC', 'ADBE', 'AXP', 'TSM', 'XOM', 'USB', 'UPS',
       'T', 'D', 'KO', 'SPG', 'L', 'GM', 'AU', 'TECK', 'DB', 'EC', 'LVS',
       'PPG', 'BP', 'EOG', 'NUE', 'MET', 'EBAY', 'EQNR', 'MFG', 'IMO',
       'CNQ', 'SCHW', 'CMI', 'ETN', 'BKR', 'SAP', 'MSI', 'AEP', 'BRFS',
       'PARA', 'BCE', 'BUD', 'WYNN', 'CNI', 'EPD', 'CME', 'PCAR', 'BAX',
       'TFC', 'BKNG', 'LIN', 'MRK', 'CHU', 'CB', 'CMG', 'DLTR', 'MPC',
       'TJX', 'ING', 'LYB', 'MA', 'PUK', 'CBD', 'DG', 'FMX', 'SMFG',
       'DEO', 'NMR', 'TRV', 'GS', 'MO', 'MUFG', 'FDX', 'V', 'TRI', 'TS',
       'FMS', 'CMCSA', 'GPS', 'ACN', 'BAC', 'AMGN', 'PFE', 'MAR', 'HON',
       'ITW', 'MSFT', 'ALL', 'AMT', 'ORLY', 'CPRI', 'RRC', 'SAN', 'MU',
       'C', 'DAL', 'FLR', 'MFC', 'OVV', 'AIG', 'WDC', 'CTRA', 'K', 'VOD',
       'NVO', 'ERIC', 'EQR', 'JCI', 'TEL', 'BXP', 'IP', 'META', 'CP',
       'KMI', 'CAH', 'SBUX', 'VZ', 'ET', 'MRO', 'NFLX', 'SWKS', 'WMB',
       'AVGO', 'MOS', 'NXPI', 'RIO', 'YPF', 'ILMN', 'PRU', 'PXD', 'UAL',
       'WY', 'BIIB', 'ENB', 'HST', 'RY', 'ADM', 'CCI', 'GILD', 'HIG',
       'KB', 'LUV', 'PLD', 'TMUS', 'WELL', 'RYAAY', 'AVB', 'EA', 'ICE',
       'WBA', 'KEP', 'WM', 'EIX', 'PCG', 'REGN', 'TV', 'TGT', 'AAL', 'MS',
       'INTU', 'SJM', 'COR', 'FE', 'BABA', 'HLT', 'AZN', 'HOLX', 'AMZN',
       'MDLZ', 'SONY', 'ABBV', 'ESS', 'ABT', 'MKL', 'NVS', 'ORAN', 'SYK',
       'INCY', 'LRCX', 'MCK', 'STLA', 'APD', 'BCS', 'CL', 'LYG', 'NVDA',
       'VALE', 'VMC', 'BMY', 'DVA', 'KMB', 'NGG', 'TAP', 'LBTYK', 'PKX',
       'ZBH', 'ZTS', 'CRM', 'RCL', 'PPL', 'LBTYB', 'HMC', 'SNN', 'WB',
       'WRK', 'KHC', 'HUM', 'STM', 'FFIV', 'NDAQ', 'HPE', 'AEG', 'IQV',
       'BTI', 'PSX', 'SU', 'NSC', 'CSX', 'EXC', 'SNPS', 'UNP', 'MCO',
       'FIS', 'TRP', 'DVN', 'CNHI', 'NTAP', 'NTR', 'PAA', 'KEYS', 'WAT',
       'BDX', 'IT', 'GSK', 'A', 'BSX', 'CSCO', 'FTV', 'TXT', 'LMT', 'UBS',
       'GOOGL', 'GOOG', 'SO', 'SRE', 'VRTX', 'JNJ', 'ORCL', 'PEP', 'ACGL',
       'CINF', 'NWG', 'ADSK', 'CDNS', 'GOLD', 'HSIC', 'MGM', 'SSNC',
       'TCOM', 'TFX', 'WBD', 'CPB', 'NTES', 'FNV', 'ROP', 'LBTYA', 'LLY',
       'MRVL', 'ATUS', 'VNO', 'ANET', 'DLR', 'SBAC', 'LOW', 'WMT', 'CNP',
       'PG', 'PTC', 'NVR', 'TTD', 'ALGN', 'AMD', 'BIO', 'WPM', 'ALB',
       'DXCM', 'EL', 'NKE', 'TPR', 'ZM', 'CTLT', 'GMAB', 'QRVO', 'LBRDA',
       'LBRDK', 'HPQ', 'JD', 'ABBNY', 'CE', 'DE', 'RVTY', 'PEAK', 'FOX',
       'FOXA', 'SNY', 'SYY', 'BIP', 'TSLA', 'BNTX', 'DFS', 'SUZ', 'PBR',
       'SHOP', 'WFC', 'APA', 'SIRI', 'AVTR', 'CG', 'SSL', 'BX', 'MELI',
       'WLK', 'ON', 'E', 'ROST', 'WTW', 'APO', 'DD', 'DOW', 'ULTA', 'TEF'],
      dtype=object)
In [41]:
len(trades['ticker'].unique())
Out[41]:
366

The second thing we can observe is that the entire strategy runs on 366 equities, broken out as follows by profit and loss.

In [42]:
# Sum of Trade PnL by ticker and calculate quantiles for filtering
daily_pnl_sum = trades.groupby('ticker')['Trade_PnL'].sum()
quantiles = daily_pnl_sum.quantile([0.10, 0.90])

# Filter and combine top 10% and bottom 10% PnLs, then sort
pnl_filtered = pd.concat([
    daily_pnl_sum[daily_pnl_sum <= quantiles[0.10]],
    daily_pnl_sum[daily_pnl_sum >= quantiles[0.90]]
]).sort_values()

# Plotting
plt.figure(figsize=(10, 10))
pnl_filtered.plot.bar(color=['red' if x < 0 else 'green' for x in pnl_filtered], title='Top & Bottom 10% Tickers by PnL')
plt.xlabel('Ticker')
plt.ylabel('Profit and Loss (PnL)')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.1f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 6)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()

[Figure: top and bottom 10% of tickers by PnL]
In [43]:
# Sum of Trade PnL by ticker and calculate quantile for filtering
daily_pnl_sum = trades.groupby('ticker')['Trade_PnL'].sum()
quantiles = daily_pnl_sum.quantile([0.90])

# Filter the top 10% PnLs, then sort
pnl_filtered = pd.concat([
    daily_pnl_sum[daily_pnl_sum >= quantiles[0.90]]
]).sort_values()

# Plotting
plt.figure(figsize=(10, 6))
pnl_filtered.plot.bar(color=['red' if x < 0 else 'green' for x in pnl_filtered], title='Top 10% Tickers by PnL')
plt.xlabel('Ticker')
plt.ylabel('Profit and Loss (PnL)')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.1f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()

[Figure: top 10% of tickers by PnL]

We can see that the greatest contribution to the profits comes from BKNG - Booking Holdings Inc. Looking at a chart of BKNG over the past 13 years provides some insights as to why. This is precisely the type of outlier that we are looking to capture.

In [44]:
bkng = qm_prices[qm_prices['ticker'] == 'BKNG'][['adj_close']].reset_index()
bkng['date'] = pd.to_datetime(bkng['date'])

# Create the initial plot
plt.figure(figsize=(10, 5))

# Plot the first y-axis data
plt.plot(bkng['date'], bkng['adj_close'], linestyle='-', color='b', linewidth=1)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Adjusted Close Price')
plt.title('Booking Holdings Inc. (BKNG) Adjusted Closing Prices')
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()
[Figure: Booking Holdings Inc. (BKNG) adjusted closing prices]

Section 3: Benchmark Comparison¶

We will use the S&P 500 index as a benchmark to compare against - specifically the SPDR S&P 500 ETF Trust with ticker symbol 'SPY'.

In [45]:
# SPY df
spy = qm_prices[qm_prices['ticker'] == 'SPY']
filtered_prices['date'] = pd.to_datetime(filtered_prices['date'])
spy.index = pd.to_datetime(spy.index)
# our first trades are in 2012
spy = spy[spy.index >= '2012']

Section 3a: Returns Comparison¶

Here we have the returns comparison between the portfolio return, the return on capital, and the return for SPY.

In [46]:
# SPY buy and hold (hodl)
pd.set_option('display.float_format', lambda x: '%.2f' % x)  # Change '.2f' as needed for your precision
spy_buy_n_hold = spy.copy()
spy_buy_n_hold['SPY_Daily_Ret'] = spy_buy_n_hold['adj_close'].pct_change()
spy_buy_n_hold['Cum_Return'] = (1 + spy_buy_n_hold['SPY_Daily_Ret']).cumprod()
spy_buy_n_hold['shares'] = int(20000000 / spy_buy_n_hold.iloc[0]['adj_close'])
spy_buy_n_hold['dollar_value'] = spy_buy_n_hold['shares'] * spy_buy_n_hold['adj_close']
spy_buy_n_hold['daily_pnl'] = spy_buy_n_hold['dollar_value'].diff()
spy_buy_n_hold_ret = qtsprojectfunctions.return_stats(spy_buy_n_hold[['SPY_Daily_Ret']])
ret_comp = pd.concat([Portfolio_Daily_Ret, Daily_Ret_On_Cap, spy_buy_n_hold_ret])
qtsprojectfunctions.dp(4)
ret_comp
Out[46]:
Mean (Annual) Volatility (Annual) Sharpe Ratio (Annual) Max Return (Daily) Max Return (Date) Min Return (Daily) Min Return (Date) Max Drawdown Peak Bottom Recovery Date
Portfolio_Daily_Ret 0.0210 0.0546 0.3850 0.0376 2019-01-04 -0.0266 2018-02-05 -0.1178 2013-12-26 2016-02-11 2018-01-17
Daily_Ret_On_Cap 0.0983 0.2089 0.4705 0.1646 2019-01-04 -0.0980 2018-02-05 -0.4231 2013-12-26 2016-02-11 2018-01-17
SPY_Daily_Ret 0.1469 0.1666 0.8820 0.0906 2020-03-24 -0.1094 2020-03-16 -0.3370 2020-02-19 2020-03-23 2020-08-10

There are a couple of important points here.

First, the annual returns for SPY beat the return on capital by nearly 5%. The historical annual return for the S&P 500 is between 9 and 10%, so we can confidently say that the return on capital is matching the historical benchmark. However, for the sample from 2012 to the present, SPY has performed significantly better than its historical average.

Second, the volatility of SPY is lower than that of the return on capital by approximately 4%, but significantly higher than the volatility that we are experiencing on the total portfolio.

Next, we will compare the cumulative returns for all 3.

In [47]:
# Create the initial plot
plt.figure(figsize=(10, 5))

# Plot the first y-axis data
plt.plot(returns_leverage.index, returns_leverage['Portfolio_Cum_Ret'], label='Portfolio Cumulative Return', linestyle='-', color='b', linewidth=2)
plt.plot(returns_leverage.index, returns_leverage['Cum_Ret_On_Cap'], label='Cumulative Return On Capital', linestyle='-', color='g', linewidth=2)
plt.plot(spy_buy_n_hold.index, spy_buy_n_hold['Cum_Return'], label='SPY Total Return', linestyle='-', color='r', linewidth=2)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Total Return')

# Formatting y-axis ticks as percentages
def percent_formatter(x, pos):
    return '{:.0f}%'.format(x * 100)

plt.gca().yaxis.set_major_formatter(FuncFormatter(percent_formatter))

plt.title('Cumulative Returns Comparison')
plt.xticks(rotation=45, fontsize=7)
plt.yticks(fontsize=7)
plt.tight_layout()
plt.grid(True)
plt.legend(fontsize=8)
plt.show()
[Figure: cumulative returns comparison, portfolio vs. return on capital vs. SPY]

This chart gives us an idea of the impact of an additional 5% per year in annual return. By the middle of 2023, the return on capital is roughly 2x our starting capital, but the return on SPY is roughly 5x!

It can also be seen from this plot that there are long stretches where we do not have any positions. This is a result of our stop loss taking effect, and we can see that the points in time where the returns are flat coincide with the points in time when SPY has recently gone through a drawdown.

Finally, let's look at the correlations between SPY returns and our portfolio returns.

In [48]:
strategy_and_spy_returns = pd.merge(returns_leverage[['Portfolio_Daily_Ret']],spy_buy_n_hold[['SPY_Daily_Ret']], 
                                    left_on=returns_leverage.index, right_on=spy_buy_n_hold.index).set_index('key_0')
strategy_and_spy_returns.corr()
Out[48]:
|                     | Portfolio_Daily_Ret | SPY_Daily_Ret |
|---------------------|---------------------|---------------|
| Portfolio_Daily_Ret | 1.0000              | 0.6074        |
| SPY_Daily_Ret       | 0.6074              | 1.0000        |

As can be seen above, the two return streams are correlated (0.61), but there are certainly diversification benefits.
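
Because a full-sample correlation can mask regime changes, a quick follow-up check is the rolling correlation; the 63-day (roughly one quarter) window below is an arbitrary choice for illustration:

# Rolling ~quarterly correlation between the strategy and SPY
rolling_corr = (strategy_and_spy_returns['Portfolio_Daily_Ret']
                .rolling(63)
                .corr(strategy_and_spy_returns['SPY_Daily_Ret']))
rolling_corr.plot(figsize=(10, 3), title='Rolling 63-Day Correlation vs SPY')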

Section 3b: Cumulative Daily Profit & Loss¶

The following plot compares the cumulative daily profit and loss for SPY vs our trading strategy.

In [49]:
spy_daily_pnl_sum = spy_buy_n_hold.groupby(spy_buy_n_hold.index)['daily_pnl'].sum()
spy_cumulative_pnl = spy_daily_pnl_sum.cumsum()

filtered_prices['date'] = pd.to_datetime(filtered_prices['date'])
daily_pnl_sum = filtered_prices.groupby('date')['Daily_PnL'].sum()
cumulative_pnl = daily_pnl_sum.cumsum()

plt.figure(figsize=(10, 5))
plt.plot(spy_cumulative_pnl.index, spy_cumulative_pnl.values, label='SPY Buy and Hold Cumulative Daily PnL', linestyle='-', color='b', linewidth=2)
plt.plot(cumulative_pnl.index, cumulative_pnl.values, label='Strategy Cumulative Daily PnL', linestyle='-', color='orange', linewidth=2)

plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Cumulative Sum of Daily PnL')
plt.title('Cumulative Daily PnL: SPY Buy & Hold vs Strategy')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.legend(fontsize = 8)
plt.show()
[Figure: Cumulative Daily PnL: SPY Buy & Hold vs Strategy]

It is important to note that the SPY series does not reflect any cash being taken out of the strategy, while our trading strategy siphons off profits at the end of every year.
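
As an illustration of that year-end harvesting, the rule can be sketched as follows, using the $20mm base capital from the SPY comparison above; this is a sketch of the idea, not our production bookkeeping:

def harvest_year_end(portfolio_value: float, base_capital: float = 20_000_000):
    """Illustrative year-end rule: move any gains above the base capital
    off book and reset the trading book to base_capital.
    Returns (new_book_value, harvested_cash)."""
    harvested = max(portfolio_value - base_capital, 0.0)
    return portfolio_value - harvested, harvested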

Section 3c: Total Trade Profit & Loss¶

Here we have a plot to show the cumulative profit and loss over the length of the trading strategy.

In [50]:
trades['entry_date'] = pd.to_datetime(trades['entry_date'])
trades.sort_values(by='entry_date', inplace=True)

# Aggregate the daily PnL of each position by the entry date of its trade
trade_pnl_sum = filtered_prices.groupby('entry_date')['Daily_PnL'].sum()
cumulative_pnl = trade_pnl_sum.cumsum()


# Plotting
plt.figure(figsize=(10, 5))
plt.plot(cumulative_pnl.index, cumulative_pnl.values, label='Cumulative Trade PnL', linewidth=2)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Cumulative Trade PnL')
plt.title('Cumulative Trade PnL Over Time')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()
[Figure: Cumulative Trade PnL Over Time]

Here's similar data, but in a bar chart format.

In [51]:
trades['entry_date'] = pd.to_datetime(trades['entry_date'])
trades['entry_year'] = trades['entry_date'].dt.year
yearly_pnl = trades.groupby('entry_year')['Trade_PnL'].sum()
plt.figure(figsize=(10, 5))
yearly_pnl.plot(kind='bar', color=['red' if x < 0 else 'green' for x in yearly_pnl])
plt.xlabel('Year')
plt.ylabel('Total Trade PnL')
plt.title('Total Trade PnL Per Year')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(axis='y')
plt.show()
[Figure: Total Trade PnL Per Year]

Finally, a similar chart for SPY, showing the total profit and loss per year over the length of the dataset.

In [52]:
spy_buy_n_hold['entry_year'] = spy_buy_n_hold.index.year
spy_yearly_pnl = spy_buy_n_hold.groupby('entry_year')['daily_pnl'].sum()
plt.figure(figsize=(10, 5))
spy_yearly_pnl.plot(kind='bar', color=['red' if x < 0 else 'green' for x in spy_yearly_pnl])
plt.xlabel('Year')
plt.ylabel('Total PnL')
plt.title('SPY Buy & Hold Total PnL Per Year')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.0f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(axis='y')
plt.show()
[Figure: SPY Buy & Hold Total PnL Per Year]

Section 4: Drawdown Analysis¶

Here we have the analysis of the maximum drawdown over the life of the trading strategy.

In [53]:
rolling_max = returns_leverage['Total_Portfolio_Value'].cummax()
drawdown = (returns_leverage['Total_Portfolio_Value'] - rolling_max) / rolling_max
# Plot drawdown
plt.figure(figsize=(10, 5))
drawdown.plot()
plt.title('Total Portfolio Drawdown by Percentage')
plt.xlabel('Year')
plt.ylabel('Drawdown (%)')
plt.gca().yaxis.set_major_formatter(FuncFormatter(percent_formatter))  # drawdown is a fraction; format ticks as %
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()
[Figure: Total Portfolio Drawdown by Percentage]

Recall from our returns analysis that the maximum drawdown of -11.78% reaches its bottom on 2016-02-11, measured from the peak on 2013-12-26, and that the strategy recovers by early 2018 (2018-01-17).
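
The peak, bottom, and recovery dates reported in the stats table can be recovered directly from a drawdown series like the one plotted above; a minimal sketch:

import pandas as pd

def drawdown_episode(drawdown: pd.Series):
    """Locate the maximum-drawdown episode: the trough, the preceding
    peak (last new high before the trough), and the recovery date
    (first return to a new high after the trough), if any."""
    trough = drawdown.idxmin()
    before = drawdown.loc[:trough]
    peak = before[before == 0].index[-1]
    after = drawdown.loc[trough:]
    recovered = after[after == 0]
    recovery = recovered.index[0] if len(recovered) else None
    return peak, trough, recovery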

Section 5: Funding Costs¶

Here we have a comparison between the cumulative funding costs and the Fed Funds Rate.

In [54]:
# Pull the Fed Funds series for comparison against the cumulative funding costs
fed_funds = fetch_fed_funds()
fed_funds = fed_funds[fed_funds.index >= '2011-01-01']
In [55]:
# Create the initial plot
fig, ax1 = plt.subplots(figsize=(10, 5))

# Plot the first y-axis data
ax1.plot(returns_leverage.index, returns_leverage['Cum_Funding_Cost'], linestyle='-', color='b', linewidth=2)
ax1.set_xlabel('Year')
ax1.set_ylabel('Total Cumulative Funding Costs', color='b')
ax1.tick_params('y', colors='b')
ax1.tick_params(axis='x', rotation=45, labelsize=7)
ax1.tick_params(axis='y', labelsize=7)
for y_tick in ax1.get_yticks():
    ax1.axhline(y_tick, color='b', linestyle=':', linewidth=1)
ax1.grid(axis='x')

# Create the second y-axis
ax2 = ax1.twinx()
ax2.plot(fed_funds.index, fed_funds['Fed_Funds_Annual'], linestyle='-', color = 'g', linewidth=2)
ax2.set_ylabel('Fed Funds Rate (%)', color='g')
ax2.tick_params('y', colors='g')
ax2.tick_params(axis='y', labelsize=7)
for y_tick in ax2.get_yticks():
    ax2.axhline(y_tick, color='g', linestyle='--', linewidth=1)

# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.1f}M'.format(x / 1e6)
ax1.yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))

# Title and grid
plt.title('Cumulative Funding Costs vs Fed Funds Rate')
plt.tight_layout()
plt.show()
[Figure: Cumulative Funding Costs vs Fed Funds Rate]

It can be seen that funding costs were very low through 2016, while interest rates were near zero, and began to increase in early 2017. They dropped again in early 2020 (at the onset of the COVID-19 pandemic), then began climbing in early 2022 and have increased significantly since.

Funding costs are a risk that is difficult to forecast, and they could certainly affect the viability of the strategy going forward.
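
The sketch below is not exactly how the backtest accrues funding; it illustrates one common convention, a daily accrual of Fed Funds plus a spread on the borrowed notional under actual/360, with a hypothetical 50 bp spread:

def daily_funding_cost(borrowed_notional: float,
                       fed_funds_annual: float,
                       spread: float = 0.005) -> float:
    """Hypothetical daily funding accrual: (Fed Funds + spread) applied
    to the borrowed notional, actual/360 convention. The 50 bp spread
    is an illustrative assumption, not the notebook's parameter."""
    return borrowed_notional * (fed_funds_annual + spread) / 360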

Section 6: Trading Costs¶

Here we have a plot of the cumulative trading costs for the entire length of the strategy.

In [56]:
returns_leverage['Cum_Trading_Costs'] = abs(returns_leverage['Trading_Costs']).cumsum()
In [57]:
# Create the initial plot
plt.figure(figsize=(10, 5))

# Plot the first y-axis data
plt.plot(returns_leverage.index, returns_leverage['Cum_Trading_Costs'], linewidth=2)
plt.gca().xaxis.set_major_locator(mdates.YearLocator())
plt.gca().xaxis.set_major_formatter(mdates.DateFormatter('%Y'))
plt.xlabel('Year')
plt.ylabel('Total Value')
plt.title('Cumulative Trading Costs')
# Define custom formatting function for y-axis labels
def millions_formatter(x, pos):
    return '{:.1f}M'.format(x / 1e6)
plt.gca().yaxis.set_major_formatter(ticker.FuncFormatter(millions_formatter))
plt.xticks(rotation = 45, fontsize = 7)
plt.yticks(fontsize = 7)
plt.tight_layout()
plt.grid(True)
plt.show()
[Figure: Cumulative Trading Costs]

Given that we start each year with nearly the same amount of capital, we expect the initial trading costs each year to be nearly identical. Throughout the year, as positions are stopped out, there will be slight variations from year to year, but in general trading costs should be very predictable for this strategy.
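
A simple notional-based model is consistent with that pattern; the 5 bp per-side rate below is a hypothetical parameter for illustration, not necessarily the rate used in the backtest:

def trade_cost(notional: float, cost_bps: float = 5.0) -> float:
    """Hypothetical flat cost model: cost_bps basis points of traded
    notional per side. With roughly equal capital deployed at each
    annual rebalance, the initial cost is nearly constant year to year."""
    return abs(notional) * cost_bps / 10_000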

Conclusion¶

In the above analysis we compared our strategy to the S&P 500 frequently. The S&P is a useful benchmark in some respects, but we set out to design a strategy that does not mirror it and that serves a different purpose. With that in mind, we offer the following interpretation of our strategy, which demonstrates its legitimate use cases and benefits:

  1. Capital preservation
  • We implemented a stop-loss mechanism that prevents any one position from losing more than 10%. This allowed us to achieve a maximum portfolio drawdown of roughly 12%, substantially lower than the S&P's 34%.
  • Note that the return on our deployed capital showed a deeper drawdown than the S&P's, but this series measures the return on capital, not the investment itself (the down years where this occurs are visible in the yearly PnL chart).
  • This differs from the S&P comparison because that figure is based on our returns rather than on total portfolio value, so the -42% maximum drawdown on capital is somewhat misleading: it is not reflective of our entire position.
  2. Tax-advantaged cash flows
  • Our strategy sells out of all positions on an annual basis, distributing gains/losses, which means we are effectively realizing capital gains/losses every year.
  • We generate around $20mm over the life of the strategy, which annualizes to a 9.83% yearly return on capital. This is lower than the S&P's return, but again our strategy fundamentally differs from, and serves a different purpose than, simply investing in the S&P.
  • The strategy generates cash flows annually and allows investors to carry forward their losses, offsetting large portions of capital gains taxes and producing what is essentially a high-yield portfolio that still benefits from rising equities through higher distributions (see the worked sketch after this list).
  3. Lower annual volatility/risk
  • Because we sell out of positions yearly and buy back in, we tend to experience less volatility than the S&P, which is attractive for certain investors; the volatility within our portfolio during the year was 5.5%, while the S&P's was 17%.
  • The cash flows/returns were more volatile than the S&P's, but our portfolio, i.e. the initial capital pool, was not. This is offset by the aforementioned fact that investors can carry forward losses, implying that true after-tax losses are lower than detailed above.
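
To make the carryforward point in item 2 concrete, here is an illustrative sketch with hypothetical yearly realized PnL figures; real tax treatment (wash sales, rate differences, offset limits) is considerably more involved:

def offset_gains(pnl_by_year, carryforward=0.0):
    """Illustrative loss carryforward: net each year's realized losses
    (plus any carried-forward losses) against realized gains.
    Yields (year, taxable_gain, remaining_carryforward)."""
    for year, pnl in pnl_by_year:
        if pnl < 0:
            carryforward += -pnl
            taxable = 0.0
        else:
            offset = min(pnl, carryforward)
            carryforward -= offset
            taxable = pnl - offset
        yield year, taxable, carryforward

# Hypothetical numbers, for illustration only:
for row in offset_gains([(2018, -2e6), (2019, 5e6)]):
    print(row)   # (2018, 0.0, 2000000.0) then (2019, 3000000.0, 0.0)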

Based on the above and the detailed analysis in the notebook, we believe we have developed a profitable strategy. This approach is distinct from a typical equity buy-and-hold strategy and offers investors with specific risk appetites alternative avenues to fixed income for generating tax-advantaged cash flows.
