Commit

Add files via upload
robsalgado authored Nov 24, 2019
1 parent 9c080d2 commit d634ecf
Showing 3 changed files with 612 additions and 0 deletions.
152 changes: 152 additions & 0 deletions trading_bot/get_data_cf.py
@@ -0,0 +1,152 @@
import pytz
import requests
import pandas as pd
import numpy as np
from datetime import datetime, timedelta
from bs4 import BeautifulSoup
from google.cloud import bigquery
import pyarrow
from google.cloud import storage
import string
import time

def daily_equity_quotes(event, context):
    # Get the api key from cloud storage
    storage_client = storage.Client()
    bucket = storage_client.get_bucket('<NAME OF YOUR CLOUD STORAGE BUCKET>')
    blob = bucket.blob('<NAME OF YOUR SECRET FILE>')
    api_key = blob.download_as_string()

    # Check if the market was open today. Cloud Functions run in UTC and I'm in
    # Eastern, so convert the timezone
    today = datetime.today().astimezone(pytz.timezone("America/New_York"))
    today_fmt = today.strftime('%Y-%m-%d')

    # Call the td ameritrade hours endpoint for equities to see if it is open
    market_url = 'https://api.tdameritrade.com/v1/marketdata/EQUITY/hours'

    params = {
        'apikey': api_key,
        'date': today_fmt
    }

    request = requests.get(
        url=market_url,
        params=params
    ).json()

    try:
        if request['equity']['EQ']['isOpen'] is True:
            # Get a current list of all the stock symbols for the NYSE
            # Create a list of every letter in the alphabet
            # Each page has a letter for all those symbols
            # i.e. http://eoddata.com/stocklist/NYSE/A.htm
            alpha = list(string.ascii_uppercase)

            symbols = []

            # Loop through the letters in the alphabet to get the stocks on each page
            # from the table and store them in a list
            for each in alpha:
                url = 'http://eoddata.com/stocklist/NYSE/{}.htm'.format(each)
                resp = requests.get(url)
                site = resp.content
                soup = BeautifulSoup(site, 'html.parser')
                table = soup.find('table', {'class': 'quotes'})
                for row in table.findAll('tr')[1:]:
                    symbols.append(row.findAll('td')[0].text.rstrip())

            # Strip the class/series suffix from each symbol (e.g. 'BF.B' -> 'BF')
            symbols_clean = []

            for each in symbols:
                each = each.replace('.', '-')
                symbols_clean.append((each.split('-')[0]))

            # The TD Ameritrade API limits how many symbols you can request in a
            # single call, so we chunk the list into 200 symbols at a time
            def chunks(l, n):
                """
                Takes in a list and how long you want
                each chunk to be
                """
                n = max(1, n)
                return (l[i:i+n] for i in range(0, len(l), n))
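            # For example, list(chunks(['A', 'B', 'C', 'D', 'E'], 2)) yields
            # [['A', 'B'], ['C', 'D'], ['E']], so the full NYSE symbol list becomes
            # batches of at most 200 symbols per request.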

            symbols_chunked = list(chunks(list(set(symbols_clean)), 200))

            # Function for the api request to get the data from td ameritrade
            def quotes_request(stocks):
                """
                Makes an api call for a list of stock symbols
                and returns a dataframe
                """
                url = r"https://api.tdameritrade.com/v1/marketdata/quotes"

                params = {
                    'apikey': api_key,
                    'symbol': stocks
                }

                request = requests.get(
                    url=url,
                    params=params
                ).json()

                time.sleep(1)

                return pd.DataFrame.from_dict(
                    request,
                    orient='index'
                ).reset_index(drop=True)

            # Loop through the chunked list of symbols
            # and call the api. Append all the resulting dataframes into one
            df = pd.concat([quotes_request(each) for each in symbols_chunked])

            # Add the date and format the dates for BigQuery
            df['date'] = pd.to_datetime(today_fmt)
            df['date'] = df['date'].dt.date
            df['divDate'] = pd.to_datetime(df['divDate'])
            df['divDate'] = df['divDate'].dt.date
            df['divDate'] = df['divDate'].fillna(np.nan)

            # Remove anything without a price
            df = df.loc[df['bidPrice'] > 0]

            # Rename columns for BigQuery (column names can't start with a number)
            df = df.rename(columns={
                '52WkHigh': '_52WkHigh',
                '52WkLow': '_52WkLow'
            })

            # Load the data into BigQuery
            client = bigquery.Client()

            dataset_id = 'equity_data'
            table_id = 'daily_quote_data'

            dataset_ref = client.dataset(dataset_id)
            table_ref = dataset_ref.table(table_id)

            job_config = bigquery.LoadJobConfig()
            job_config.source_format = bigquery.SourceFormat.CSV
            job_config.autodetect = True
            job_config.ignore_unknown_values = True
            job = client.load_table_from_dataframe(
                df,
                table_ref,
                location='US',
                job_config=job_config
            )

            job.result()

            return 'Success'

        else:
            # Market not open today
            pass
    except KeyError:
        # Not a weekday
        pass
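# Local smoke test (hypothetical, not part of the deployed function): the Cloud
# Functions runtime supplies the event and context arguments, but neither is used
# above, so None works for an ad-hoc run.
# if __name__ == '__main__':
#     print(daily_equity_quotes(None, None))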
45 changes: 45 additions & 0 deletions trading_bot/portfolio_summary_by_day_query.sql
@@ -0,0 +1,45 @@
-- CTE to join our portfolio with the
-- daily closing prices

WITH prices_joined AS (
  SELECT
    strat_log.symbol AS symbol,
    qty,
    strat_log.date AS date,
    closePrice * qty AS market_value
  FROM
    `<YOUR PROJECT>.equity_data.strategy_log` AS strat_log
  JOIN (
    SELECT
      closePrice,
      symbol,
      date
    FROM
      `<YOUR PROJECT>.equity_data.daily_quote_data`
  ) AS price_data
  ON
    strat_log.symbol = price_data.symbol
    AND strat_log.date = price_data.date
  WHERE
    strat = 'momentum_strat_1'
)

-- Main query to get the portfolio total
-- by day along with the percent change
-- from the previous day
SELECT
  date,
  ROUND(total, 2) AS total,
  ROUND((total / prev_day - 1) * 100, 2) AS perc_diff
FROM (
  SELECT
    date,
    SUM(market_value) AS total,
    LAG(SUM(market_value)) OVER (ORDER BY date) AS prev_day
  FROM
    prices_joined
  GROUP BY
    date
)
ORDER BY
  date
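-- Illustration (made-up numbers): if yesterday's total was 100000.00 and today's
-- is 101250.00, LAG() supplies 100000.00 as prev_day, so
-- perc_diff = (101250.00 / 100000.00 - 1) * 100 = 1.25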
415 changes: 415 additions & 0 deletions trading_bot/trading_bot_cf.py
@@ -0,0 +1,415 @@
import pandas as pd
import numpy as np
from scipy import stats
import requests
import time
from datetime import datetime
import pytz
from google.cloud import bigquery
from google.cloud import storage
import pyarrow
import alpaca_trade_api as tradeapi
from pypfopt.efficient_frontier import EfficientFrontier
from pypfopt import risk_models
from pypfopt import expected_returns
from pypfopt.discrete_allocation import DiscreteAllocation, get_latest_prices

def trade_bot(event, context):
    # Get the api key from cloud storage
    storage_client = storage.Client()
    bucket = storage_client.get_bucket('<NAME OF YOUR CLOUD STORAGE BUCKET>')
    blob = bucket.blob('<NAME OF YOUR SECRET FILE>')
    api_key = blob.download_as_string()

    # Check if the market was open today
    today = datetime.today().astimezone(pytz.timezone("America/New_York"))
    today_fmt = today.strftime('%Y-%m-%d')

    market_url = 'https://api.tdameritrade.com/v1/marketdata/EQUITY/hours'

    params = {
        'apikey': api_key,
        'date': today_fmt
    }

    request = requests.get(
        url=market_url,
        params=params
    ).json()

    try:
        if request['equity']['EQ']['isOpen'] is True:
            # Alpaca creds and api
            blob = bucket.blob('<NAME OF YOUR SECRET FILE>')
            keys = blob.download_as_string()
            keys_str = keys.decode().split(',')
            key_id = keys_str[0]
            secret_key = keys_str[1]

            # Initialize the alpaca api
            base_url = "https://paper-api.alpaca.markets"

            api = tradeapi.REST(
                key_id,
                secret_key,
                base_url,
                'v2'
            )

            # BQ creds
            client = bigquery.Client()

            # Load the historical stock data from BQ
            sql_hist = """
                SELECT
                  symbol,
                  closePrice,
                  date
                FROM
                  `trading-247-365.equity_data.daily_quote_data`
            """

            df = client.query(sql_hist).to_dataframe()

            # Convert the date column to datetime
            df['date'] = pd.to_datetime(df['date'])

            # Sort by date (ascending) for the momentum calculation
            df = df.sort_values(by='date').reset_index(drop=True)

            # Rename the column
            df = df.rename(columns={'closePrice': 'close'})

            # Get the current positions from alpaca and create a df
            positions = api.list_positions()

            symbol, qty, market_value = [], [], []

            for each in positions:
                symbol.append(each.symbol)
                qty.append(int(each.qty))
                market_value.append(float(each.market_value))

            df_pf = pd.DataFrame(
                {
                    'symbol': symbol,
                    'qty': qty,
                    'market_value': market_value
                }
            )

            # Current portfolio value
            portfolio_value = round(df_pf['market_value'].sum(), 2)

            # Calculate the momentum and select the stocks to buy
            # Set the variables for the momentum trading strategy
            momentum_window = 125
            minimum_momentum = 40

            # Momentum score function
            def momentum_score(ts):
                x = np.arange(len(ts))
                log_ts = np.log(ts)
                regress = stats.linregress(x, log_ts)
                annualized_slope = (np.power(np.exp(regress[0]), 252) - 1) * 100
                return annualized_slope * (regress[2] ** 2)
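            # Rough intuition for the score above: the slope of a linear fit on log
            # prices is a daily growth rate, exp(slope) ** 252 - 1 annualizes it as
            # a percent, and multiplying by r-squared (regress[2] ** 2) down-weights
            # noisy, low-confidence trends.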

            df['momentum'] = df.groupby('symbol')['close'].rolling(
                momentum_window,
                min_periods=minimum_momentum
            ).apply(momentum_score).reset_index(level=0, drop=True)

            # Get the top momentum stocks for the period
            # Set the portfolio size we want
            portfolio_size = 10

            # Function to get the momentum stocks we want
            def get_momentum_stocks(df, date, portfolio_size, cash):
                # Filter the df to get the top 10 momentum stocks for the latest day
                df_top_m = df.loc[df['date'] == pd.to_datetime(date)]
                df_top_m = df_top_m.sort_values(by='momentum', ascending=False).head(portfolio_size)

                # Set the universe to the top momentum stocks for the period
                universe = df_top_m['symbol'].tolist()

                # Create a df with just the stocks from the universe
                df_u = df.loc[df['symbol'].isin(universe)]

                # Create the portfolio
                # Pivot to format for the optimization library
                df_u = df_u.pivot_table(
                    index='date',
                    columns='symbol',
                    values='close',
                    aggfunc='sum'
                )

                # Calculate expected returns and sample covariance
                mu = expected_returns.mean_historical_return(df_u)
                S = risk_models.sample_cov(df_u)

                # Optimise the portfolio for maximal Sharpe ratio
                ef = EfficientFrontier(mu, S, gamma=1)  # Use regularization (gamma=1)
                weights = ef.max_sharpe()
                cleaned_weights = ef.clean_weights()

                # Allocate
                latest_prices = get_latest_prices(df_u)

                da = DiscreteAllocation(
                    cleaned_weights,
                    latest_prices,
                    total_portfolio_value=cash
                )

                allocation = da.lp_portfolio()[0]

                # Put the stocks and the number of shares from the portfolio into a df
                symbol_list = []
                num_shares_list = []

                for symbol, num_shares in allocation.items():
                    symbol_list.append(symbol)
                    num_shares_list.append(num_shares)

                # Now that we have the stocks we want to buy, we filter the df for those ones
                df_buy = df.loc[df['symbol'].isin(symbol_list)]

                # Filter for the period to get the closing price
                df_buy = df_buy.loc[df_buy['date'] == date].sort_values(by='symbol')

                # Add in the qty that was allocated to each stock
                df_buy['qty'] = num_shares_list

                # Calculate the amount we own for each stock
                df_buy['amount_held'] = df_buy['close'] * df_buy['qty']
                df_buy = df_buy.loc[df_buy['qty'] != 0]
                return df_buy

            # Call the function
            df_buy = get_momentum_stocks(
                df=df,
                date=today_fmt,
                portfolio_size=portfolio_size,
                cash=portfolio_value
            )

            # Figure out which stocks we need to sell

            # Create a list of stocks to sell based on what is currently in our pf
            sell_list = list(set(df_pf['symbol'].tolist()) - set(df_buy['symbol'].tolist()))

            def sell_stocks(df, df_pf, sell_list, date):
                # Get the current prices and the number of shares to sell
                df_sell_price = df.loc[df['date'] == pd.to_datetime(date)]

                # Filter
                df_sell_price = df_sell_price.loc[df_sell_price['symbol'].isin(sell_list)]

                # Check whether any stocks we currently hold are missing from the
                # new buy list. It's possible there may not be any
                if df_sell_price.shape[0] > 0:
                    df_sell_price = df_sell_price[[
                        'symbol',
                        'close'
                    ]]

                    # Merge with the current pf to get the number of shares we bought initially
                    # so we know how many to sell
                    df_buy_shares = df_pf[[
                        'symbol',
                        'qty'
                    ]]

                    df_sell = pd.merge(
                        df_sell_price,
                        df_buy_shares,
                        on='symbol',
                        how='left'
                    )

                else:
                    df_sell = None

                return df_sell

            # Call the function
            df_sell = sell_stocks(
                df=df,
                df_pf=df_pf,
                sell_list=sell_list,
                date=today_fmt
            )

            # Build the full sell list, i.e. anything not in the current df_buy
            # plus any positions whose qty decreased
            def stock_diffs(df_sell, df_pf, df_buy):
                # Select only the columns we need
                df_stocks_held_prev = df_pf[['symbol', 'qty']]
                df_stocks_held_curr = df_buy[['symbol', 'qty', 'date', 'close']]

                # Inner merge to get the stocks that are the same week to week
                df_stock_diff = pd.merge(
                    df_stocks_held_curr,
                    df_stocks_held_prev,
                    on='symbol',
                    how='inner'
                )

                # Calculate any difference in positions based on the new pf
                df_stock_diff['share_amt_change'] = df_stock_diff['qty_x'] - df_stock_diff['qty_y']

                # Create df with the share difference and current closing price
                df_stock_diff = df_stock_diff[[
                    'symbol',
                    'share_amt_change',
                    'close'
                ]]

                # If there are fewer shares compared to last week for the stocks that
                # are still in our portfolio, sell those shares
                df_stock_diff_sale = df_stock_diff.loc[df_stock_diff['share_amt_change'] < 0]

                # If there are stocks whose qty decreased,
                # add the df with the stocks that dropped out of the pf
                if df_stock_diff_sale.shape[0] > 0:
                    if df_sell is not None:
                        df_sell_final = pd.concat([df_sell, df_stock_diff_sale])
                        # Fill in NaNs in the share amount change column with
                        # the qty of the stocks no longer in the pf
                        df_sell_final['share_amt_change'] = df_sell_final['share_amt_change'].fillna(df_sell_final['qty'])
                        # Turn the negative numbers into positive for the order
                        df_sell_final['share_amt_change'] = np.abs(df_sell_final['share_amt_change'])
                        # Drop the original qty column before renaming so we don't
                        # end up with two 'qty' columns
                        df_sell_final = df_sell_final.drop(columns='qty').rename(columns={'share_amt_change': 'qty'})
                    else:
                        df_sell_final = df_stock_diff_sale
                        # Turn the negative numbers into positive for the order
                        df_sell_final['share_amt_change'] = np.abs(df_sell_final['share_amt_change'])
                        df_sell_final = df_sell_final.rename(columns={'share_amt_change': 'qty'})
                else:
                    df_sell_final = None

                return df_sell_final
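            # Illustrative scenario (hypothetical numbers): if we hold 10 shares of a
            # stock and the new allocation calls for 7, share_amt_change is -3 and
            # 3 shares are queued to sell; stocks that dropped out of the buy list
            # entirely arrive via df_sell with their full qty.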

            df_sell_final = stock_diffs(
                df_sell=df_sell,
                df_pf=df_pf,
                df_buy=df_buy
            )

            # Send the sell orders to the api
            if df_sell_final is not None:
                symbol_list = df_sell_final['symbol'].tolist()
                qty_list = df_sell_final['qty'].tolist()

                for symbol, qty in list(zip(symbol_list, qty_list)):
                    api.submit_order(
                        symbol=symbol,
                        qty=qty,
                        side='sell',
                        type='market',
                        time_in_force='day'
                    )

            # Buy the stocks that increased in shares compared
            # to last week or any new stocks
            def df_buy_new(df_pf, df_buy):
                # Merge the current pf with the new buy list. A right merge keeps
                # stocks we don't hold yet, so brand-new symbols are included
                df_buy_new = pd.merge(
                    df_pf,
                    df_buy,
                    on='symbol',
                    how='right'
                )

                # Get the qty we need to increase our positions by
                # (stocks we don't hold yet have no existing qty, so treat it as 0)
                df_buy_new['qty_new'] = (df_buy_new['qty_y'] - df_buy_new['qty_x'].fillna(0)).astype(int)

                # Filter for only shares that increased
                df_buy_new = df_buy_new.loc[df_buy_new['qty_new'] > 0]
                if df_buy_new.shape[0] > 0:
                    df_buy_new = df_buy_new[[
                        'symbol',
                        'qty_new'
                    ]]
                    df_buy_new = df_buy_new.rename(columns={'qty_new': 'qty'})
                else:
                    df_buy_new = None

                return df_buy_new
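            # Illustrative scenario (hypothetical numbers): if we hold 5 shares of a
            # stock and the new allocation calls for 8, qty_new is 3 and 3 more
            # shares are bought; a brand-new symbol has no existing qty, so its full
            # target qty is bought.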

            # Call the function
            df_buy_new = df_buy_new(
                df_pf=df_pf,
                df_buy=df_buy
            )

            # Send the buy orders to the api
            if df_buy_new is not None:
                symbol_list = df_buy_new['symbol'].tolist()
                qty_list = df_buy_new['qty'].tolist()

                for symbol, qty in list(zip(symbol_list, qty_list)):
                    api.submit_order(
                        symbol=symbol,
                        qty=qty,
                        side='buy',
                        type='market',
                        time_in_force='day'
                    )

            # Log the updated pf
            positions = api.list_positions()

            symbol, qty = [], []

            for each in positions:
                symbol.append(each.symbol)
                qty.append(int(each.qty))

            # New position df
            position_df = pd.DataFrame(
                {
                    'symbol': symbol,
                    'qty': qty
                }
            )

            # Add the current date and other info into the portfolio df for logging
            position_df['date'] = pd.to_datetime(today_fmt)
            position_df['strat'] = 'momentum_strat_1'

            # Add the new pf to BQ
            # Format date to match schema
            position_df['date'] = position_df['date'].dt.date

            # Append it to the strategy log table
            dataset_id = 'equity_data'
            table_id = 'strategy_log'

            dataset_ref = client.dataset(dataset_id)
            table_ref = dataset_ref.table(table_id)

            job_config = bigquery.LoadJobConfig()
            job_config.source_format = bigquery.SourceFormat.CSV
            job_config.autodetect = True
            job_config.ignore_unknown_values = True

            job = client.load_table_from_dataframe(
                position_df,
                table_ref,
                location='US',
                job_config=job_config
            )

            job.result()

            return 'Success'

        else:
            # Market not open today
            pass

    except KeyError:
        # Not a weekday
        pass
