### Load packages
import pandas as pd
import numpy as np
import yfinance as yf
import datetime as dt
import matplotlib.pyplot as plt
from datetime import timedelta

### Magic command to allow inline display of plots in a jupyter notebook.
### NOTE: this line is IPython syntax, not Python; it only runs inside a notebook / IPython session.
%matplotlib inline

### Settings to allow the lists of results to not be truncated.
### None lifts the limit on displayed rows / columns; cell text is cut off at 140 characters.
pd.set_option('display.max_rows', None)
pd.set_option('display.max_colwidth', 140)
pd.set_option('display.max_columns', None)

### Make exponentiated values appear as 2 decimal place float.
### This only changes how pandas prints floats; the stored values keep full precision.
pd.options.display.float_format = '{:.2f}'.format

# Create the yfinance handle used by the following cells to query SPY.
tkr = yf.Ticker("SPY")
#tkr is now a yfinance Ticker object for SPY.

# Fetch price history using yfinance's default arguments and preview the first rows.
# NOTE(review): the sample output for this cell starts about one month before the
# run date, so the default period is presumably one month — confirm for the
# installed yfinance version.
spy_data_df = tkr.history()
spy_data_df.head()

# Display the dictionary of descriptive fields yfinance exposes for this ticker.
tkr.info

{'previousClose': 421.65,
 'regularMarketOpen': 422.96,
 'twoHundredDayAverage': 392.55035,
 'trailingAnnualDividendYield': None,
 'payoutRatio': None,
 'volume24Hr': None,
 'regularMarketDayHigh': 424.62,
 'navPrice': 421.53,
 'averageDailyVolume10Day': 52061657,
 'totalAssets': 361937436672,
 'regularMarketPreviousClose': 421.65,
 'fiftyDayAverage': 417.1997,
 'trailingAnnualDividendRate': None,
 'open': 422.96,
 'toCurrency': None,
 'averageVolume10days': 52061657,
 'expireDate': None,
 'yield': 0.013300001,
 'algorithm': None,
 'dividendRate': None,
 'exDividendDate': None,
 'beta': None,
 'circulatingSupply': None,
 'startDate': None,
 'regularMarketDayLow': 421.56,
 'priceHint': 2,
 'currency': 'USD',
 'regularMarketVolume': 18413511,
 'lastMarket': None,
 'maxSupply': None,
 'openInterest': None,
 'marketCap': None,
 'volumeAllCurrencies': None,
 'strikePrice': None,
 'averageVolume': 76217779,
 'priceToSalesTrailing12Months': None,
 'dayLow': 421.56,
 'ask': 422.17,
 'ytdReturn': None,
 'askSize': 900,
 'volume': 18413511,
 'fiftyTwoWeekHigh': 424.62,
 'forwardPE': None,
 'maxAge': 1,
 'fromCurrency': None,
 'fiveYearAvgDividendYield': None,
 'fiftyTwoWeekLow': 296.74,
 'bid': 422.37,
 'tradeable': False,
 'dividendYield': None,
 'bidSize': 900,
 'dayHigh': 424.62,
 'exchange': 'PCX',
 'shortName': 'SPDR S&P 500',
 'longName': 'SPDR S&P 500 ETF Trust',
 'exchangeTimezoneName': 'America/New_York',
 'exchangeTimezoneShortName': 'EDT',
 'isEsgPopulated': False,
 'gmtOffSetMilliseconds': '-14400000',
 'quoteType': 'ETF',
 'symbol': 'SPY',
 'messageBoardId': 'finmb_6160262',
 'market': 'us_market',
 'annualHoldingsTurnover': None,
 'enterpriseToRevenue': None,
 'beta3Year': 1,
 'profitMargins': None,
 'enterpriseToEbitda': None,
 '52WeekChange': None,
 'morningStarRiskRating': None,
 'forwardEps': None,
 'revenueQuarterlyGrowth': None,
 'fundInceptionDate': 727660800,
 'annualReportExpenseRatio': None,
 'bookValue': None,
 'fundFamily': 'SPDR State Street Global Advisors',
 'lastFiscalYearEnd': None,
 'netIncomeToCommon': None,
 'trailingEps': None,
 'lastDividendValue': None,
 'SandP52WeekChange': None,
 'priceToBook': None,
 'nextFiscalYearEnd': None,
 'mostRecentQuarter': None,
 'enterpriseValue': None,
 'threeYearAverageReturn': 0.1696,
 'lastSplitDate': None,
 'lastSplitFactor': None,
 'legalType': 'Exchange Traded Fund',
 'lastDividendDate': None,
 'morningStarOverallRating': None,
 'earningsQuarterlyGrowth': None,
 'pegRatio': None,
 'lastCapGain': None,
 'category': 'Large Blend',
 'fiveYearAverageReturn': 0.1691,
 'phone': '866-732-8673',
 'longBusinessSummary': 'The investment seeks to provide investment results that, before expenses, correspond generally to the price and yield performance of the S&P 500® Index.\n The Trust seeks to achieve its investment objective by holding a portfolio of the common stocks that are included in the index (the “Portfolio”), with the weight of each stock in the Portfolio substantially corresponding to the weight of such stock in the index.',
 'companyOfficers': [],
 'regularMarketPrice': 422.96,
 'logo_url': ''}

# To see a list of all the dividends that have been paid.
# NOTE(review): the output recorded for this cell is an empty Series. Presumably
# the attribute only reflects the date range of the most recent history() call
# (the short default one above) — confirm against the yfinance documentation.
tkr.dividends

Series([], Name: Dividends, dtype: int64)

# Re-download SPY over the longest period available. With auto_adjust = False the
# result carries both "Close" and a separate "Adj Close" column (see the column
# listing printed by info() below).
spy_data_df = tkr.history(period = "max", auto_adjust = False)
# Print the index range, column names, non-null counts and dtypes.
spy_data_df.info()

<class 'pandas.core.frame.DataFrame'>
DatetimeIndex: 7143 entries, 1993-01-29 to 2021-06-10
Data columns (total 8 columns):
Open            7143 non-null float64
High            7143 non-null float64
Low             7143 non-null float64
Close           7143 non-null float64
Adj Close       7143 non-null float64
Volume          7143 non-null int64
Dividends       7143 non-null float64
Stock Splits    7143 non-null int64
dtypes: float64(6), int64(2)
memory usage: 502.2 KB

# Insert a Symbol column
# It goes in position 0 (the first column) and holds the constant "SPY" on every
# row, so rows stay identifiable once several tickers share one dataframe.
spy_data_df.insert(0, "Symbol", value = "SPY")
spy_data_df.head()

### Load the list of stock symbols into a dataframe.
### The file is read without a header row (header = None), so the two column
### names are supplied here instead.
symbols_df = pd.read_csv("Symbols.txt", header = None, names = ["Symbol", "Name"])
symbols_df

# Download the full price history of every symbol in symbols_df and combine the
# results into one dataframe, all_data_df, with a "Symbol" column identifying
# which rows belong to which ticker.
#
# Each symbol's frame is collected in a list and concatenated once at the end.
# DataFrame.append was deprecated in pandas 1.4 and removed in pandas 2.0, and
# calling it inside the loop re-copied every previously downloaded row on each
# pass.
price_frames = []

for STOCK_FUND_SYMBOL in symbols_df["Symbol"]:
    tkr = yf.Ticker(STOCK_FUND_SYMBOL)
    stock_price_df = tkr.history(period = "max", auto_adjust = False, debug = False)
    # debug = False, prevents error messages from being streamed to the console.

    # Insert a Symbol column
    stock_price_df.insert(0, "Symbol", value = STOCK_FUND_SYMBOL)

    price_frames.append(stock_price_df)

# Fail with a clear message instead of an opaque error further down when the
# symbol list turned out to be empty.
if not price_frames:
    raise ValueError("No symbols were loaded, so there is no price data to combine.")

# sort = True orders the columns alphabetically whenever the individual frames
# do not all share the same columns (the same option the append call used).
all_data_df = pd.concat(price_frames, sort = True)

all_data_df.head()

# See which Symbols do not have data
# A symbol counts as missing when it was requested in symbols_df but never
# appears in the Symbol column of the downloaded rows.
requested_symbols = symbols_df[["Symbol"]]
downloaded_symbols = pd.unique(all_data_df['Symbol'])
nodata = requested_symbols[~requested_symbols["Symbol"].isin(downloaded_symbols)]
nodata

# Plot the adjusted closing price of every symbol that has data, one chart per
# grid cell, with SPY drawn in red so the benchmark stands out.

# Create a list of symbols (in the order they appear in the downloaded data)
symbols_lst = pd.unique(all_data_df['Symbol'])

# Get the names of the stocks to be plotted using the symbols_df dataframe.
# Each name is looked up by its symbol, so a title can never be paired with the
# wrong chart even if the two sequences were ordered differently.
name_by_symbol = dict(zip(symbols_df["Symbol"], symbols_df["Name"]))
names_lst = [name_by_symbol[symbol] for symbol in symbols_lst]

# Register pandas' datetime converters explicitly. Relying on the implicit
# registration makes pandas emit a FutureWarning when a date index is plotted.
from pandas.plotting import register_matplotlib_converters
register_matplotlib_converters()

numrows = 8  # Arrange the plots in this number of rows
numcols = 2  # Arrange the plots in this number of columns

# squeeze = False keeps axes a 2-D array even for a single row or column.
fig, axes = plt.subplots(numrows, numcols, figsize=(30,60), squeeze = False)

# axes.flat visits the grid row by row. zip stops as soon as either the grid or
# the symbol list is exhausted, so having fewer symbols than grid cells no
# longer indexes past the end of symbols_lst (the old inner-loop break left the
# outer loop running).
for ax, symbol, name in zip(axes.flat, symbols_lst, names_lst):
    price_df = all_data_df.loc[all_data_df["Symbol"] == symbol, ['Adj Close']]

    # Highlight the SPY chart using red.
    axcolor = 'red' if symbol == 'SPY' else 'black'

    ax.plot(price_df, color = axcolor)
    ax.set_title(symbol + ' - ' + name, fontsize = 28, color = axcolor)
    ax.set_ylabel('Adjusted Close', fontsize = 24, color = axcolor)
    ax.tick_params(direction = 'out',
                   length = 6,
                   width = 2,
                   labelsize = 20,
                   colors = axcolor)

# Hide any grid cells left over when there are fewer symbols than cells.
for unused_ax in axes.flat[len(symbols_lst):]:
    unused_ax.set_visible(False)

/Users/mitchellfawcett/anaconda3/lib/python3.7/site-packages/pandas/plotting/_converter.py:129: FutureWarning: Using an implicitly registered datetime converter for a matplotlib plotting method. The converter was registered by pandas on import. Future versions of pandas will require you to explicitly register matplotlib converters.

To register the converters:
	>>> from pandas.plotting import register_matplotlib_converters
	>>> register_matplotlib_converters()
  warnings.warn(msg, FutureWarning)

# Get the starting and ending dates (which is the row index) of the price data for each symbol.
# Cite: jezrael
# At https://stackoverflow.com/questions/47115448/pandas-get-index-of-first-and-last-element-by-group
# The index is turned into a Series so it can be grouped by the Symbol column
# and reduced to its first and last entry per symbol.
row_dates = all_data_df.index.to_series()
fund_startend_date_df = row_dates.groupby(all_data_df['Symbol']).agg(['first', 'last'])

# Examine results
fund_startend_date_df

# Get the starting and ending price for each symbol
# Same first/last reduction, applied to the adjusted closing price.
adj_close_by_symbol = all_data_df.groupby("Symbol")['Adj Close']
fund_startend_price_df = adj_close_by_symbol.agg(['first', 'last'])

# Examine results
fund_startend_price_df

### Calculate the CAGR
# CAGR % = ((ending price / starting price) ** (1 / years) - 1) * 100

# Number of years and fraction of year each symbol's data covers
# (a year is taken to be 365 days).
data_span = fund_startend_date_df['last'] - fund_startend_date_df['first']
num_years = data_span / timedelta(days=365)

# Ratio of change in price from beginning of data to end.
price_ratio = fund_startend_price_df['last'] / fund_startend_price_df['first']

# CAGR, one row per symbol, expressed as a percentage.
annual_growth = price_ratio ** (1 / num_years) - 1.0
cagr_df = (annual_growth * 100).to_frame('CAGR %')

cagr_df

	Open	High	Low	Close	Volume	Dividends	Stock Splits
Date
2021-05-10	422.50	422.74	417.81	417.94	81852400	0	0
2021-05-11	413.10	415.27	410.06	414.21	116888000	0	0
2021-05-12	411.23	412.59	404.00	405.41	134811000	0	0
2021-05-13	407.07	412.35	407.02	410.28	106394000	0	0
2021-05-14	413.21	417.49	413.18	416.58	82123100	0	0

	Symbol	Open	High	Low	Close	Adj Close	Volume	Dividends	Stock Splits
Date
1993-01-29	SPY	43.97	43.97	43.75	43.94	25.88	1003200	0.00	0
1993-02-01	SPY	43.97	44.25	43.97	44.25	26.07	480500	0.00	0
1993-02-02	SPY	44.22	44.38	44.12	44.34	26.12	201300	0.00	0
1993-02-03	SPY	44.41	44.84	44.38	44.81	26.40	529400	0.00	0
1993-02-04	SPY	44.97	45.09	44.47	45.00	26.51	531500	0.00	0

	Symbol	Name
0	AMDVX	Am Cntry Midcp Value
1	FLCNX	Fdlty Cntrfnd
2	MDIZX	Mfs Intl Dvrsfctn
3	PMEGX	T Rowe Midcp Eqty Grwth
4	SPY	S & P 500 ETF
5	TIREX	Tiaa Crf Real Estat Secrt
6	VEVRX	Victory Sycmre Estbls Value
7	VEIRX	Vngrd Eqty Incm
8	VIEIX	Vngrd Extnd Mrkt Indx
9	VWEAX	Vngrd High Yld Corp
10	VIIIX	Vngrd Indx
11	VIPIX	Vngrd Infl Prtct Secrt
12	VSCIX	Vngrd Smcp Indx
13	VUSXX	Vngrd Trsy Mny Mrkt
14	VBTIX	Vngrd Ttl Bond Mrkt Indx
15	VTSNX	Vngrd Ttl Intl Stck Indx
16	WACSX	Wstrn Asst Core Bond

	Adj Close	Close	Dividends	High	Low	Open	Stock Splits	Symbol	Volume
Date
2013-07-26	13.68	15.66	0.00	15.66	15.66	15.66	0.00	AMDVX	0.00
2013-07-29	13.61	15.58	0.00	15.58	15.58	15.58	0.00	AMDVX	0.00
2013-07-31	13.62	15.60	0.00	15.60	15.60	15.60	0.00	AMDVX	0.00
2013-08-01	13.82	15.82	0.00	15.82	15.82	15.82	0.00	AMDVX	0.00
2013-08-02	13.77	15.77	0.00	15.77	15.77	15.77	0.00	AMDVX	0.00

	first	last
Symbol
AMDVX	2013-07-26	2021-06-09
FLCNX	2017-05-25	2021-06-09
MDIZX	2017-10-05	2021-06-09
PMEGX	1996-07-30	2021-06-09
SPY	1993-01-29	2021-06-10
TIREX	2002-09-30	2021-06-09
VBTIX	1995-09-18	2021-06-09
VEIRX	2001-08-13	2021-06-09
VEVRX	2014-03-10	2021-06-09
VIEIX	1997-07-07	2021-06-09
VIIIX	1997-07-07	2021-06-09
VIPIX	2003-12-15	2021-06-09
VSCIX	1997-07-07	2021-06-09
VTSNX	2010-11-29	2021-06-09
VWEAX	2001-11-12	2021-06-09
WACSX	2008-08-29	2021-06-09

How to Download Stock Data Using Python

Outline of this project

Project setup

yfinance package basics

Other features of yfinance

Download data for one ticker symbol

"Adjusted" prices are important

Download data for a portfolio

Plot the adjusted prices

Comparing returns

Compound Annual Growth Rate formula

Conclusion

	CAGR %
Symbol
AMDVX	5.00
FLCNX	20.09
MDIZX	10.55
PMEGX	8.62
SPY	10.34
TIREX	6.99
VBTIX	4.86
VEIRX	6.03
VEVRX	6.58
VIEIX	8.18
VIIIX	8.04
VIPIX	4.02
VSCIX	8.29
VTSNX	6.49
VWEAX	5.98
WACSX	5.30

	first	last
Symbol
AMDVX	13.68	20.09
FLCNX	9.90	20.75
MDIZX	17.97	25.99
PMEGX	9.83	76.94
SPY	25.88	422.51
TIREX	6.11	21.63
VBTIX	3.33	11.30
VEIRX	29.01	92.72
VEVRX	32.29	51.29
VIEIX	21.48	140.92
VIIIX	57.99	369.57
VIPIX	5.85	11.65
VSCIX	16.11	108.45
VTSNX	74.28	144.06
VWEAX	1.91	5.97
WACSX	6.84	13.24