!pip install yfinance

Requirement already satisfied: yfinance in c:\programdata\anaconda3\lib\site-packages (0.1.63)
Requirement already satisfied: numpy>=1.15 in c:\users\dell\appdata\roaming\python\python38\site-packages (from yfinance) (1.19.5)
Requirement already satisfied: requests>=2.20 in c:\users\dell\appdata\roaming\python\python38\site-packages (from yfinance) (2.26.0)
Requirement already satisfied: multitasking>=0.0.7 in c:\programdata\anaconda3\lib\site-packages (from yfinance) (0.0.9)
Requirement already satisfied: pandas>=0.24 in c:\programdata\anaconda3\lib\site-packages (from yfinance) (1.2.4)
Requirement already satisfied: lxml>=4.5.1 in c:\programdata\anaconda3\lib\site-packages (from yfinance) (4.6.3)
Requirement already satisfied: pytz>=2017.3 in c:\programdata\anaconda3\lib\site-packages (from pandas>=0.24->yfinance) (2021.1)
Requirement already satisfied: python-dateutil>=2.7.3 in c:\programdata\anaconda3\lib\site-packages (from pandas>=0.24->yfinance) (2.8.1)
Requirement already satisfied: six>=1.5 in c:\programdata\anaconda3\lib\site-packages (from python-dateutil>=2.7.3->pandas>=0.24->yfinance) (1.15.0)
Requirement already satisfied: charset-normalizer~=2.0.0 in c:\users\dell\appdata\roaming\python\python38\site-packages (from requests>=2.20->yfinance) (2.0.7)
Requirement already satisfied: urllib3<1.27,>=1.21.1 in c:\programdata\anaconda3\lib\site-packages (from requests>=2.20->yfinance) (1.26.4)
Requirement already satisfied: certifi>=2017.4.17 in c:\programdata\anaconda3\lib\site-packages (from requests>=2.20->yfinance) (2020.12.5)
Requirement already satisfied: idna<4,>=2.5 in c:\programdata\anaconda3\lib\site-packages (from requests>=2.20->yfinance) (2.10)


import os

import cufflinks
import numpy as np
import pandas as pd
import plotly.express as px
import plotly.io as pio
import yfinance as yf
# Global plotting/display configuration for the notebook; these calls mutate
# library-wide state, so they run once before any figure is produced.
# NOTE(review): go_offline() presumably switches cufflinks to plotly's offline
# rendering so that .iplot() works without a Chart Studio account — confirm.
cufflinks.go_offline()
# Default sharing flag and colour theme applied to every later .iplot() call.
cufflinks.set_config_file(world_readable=True, theme='pearl')
pio.renderers.default = "notebook" # adjust for other front ends; inspect pio.renderers for the available names

# None removes the column cap so wide frames are displayed without truncation.
pd.options.display.max_columns = None


symbols = ["AAPL"]

# Ask for the full history and unadjusted prices explicitly instead of relying
# on yfinance's defaults: the analysis below expects decades of rows and a
# separate "Adj Close" column, and the library defaults for `period` and
# `auto_adjust` have changed between releases.
df = yf.download(tickers=symbols, period="max", auto_adjust=False)
df.head()

[*********************100%***********************]  1 of 1 completed


# Newer yfinance releases can return (field, ticker) MultiIndex columns even
# for a single ticker; keep only the field level so the names are plain
# strings. Only done for one ticker, where the field names stay unique.
if isinstance(df.columns, pd.MultiIndex) and len(symbols) == 1:
    df.columns = df.columns.get_level_values(0)

# convert column names into lowercase
df.columns = [c.lower() for c in df.columns]
# "adj close" contains a space; use an identifier-friendly name instead.
df.rename(columns={"adj close": "adj_close"}, inplace=True)


# Per-column missing-value summary: one row per column of df with the total
# row count, the number of null cells and the null fraction.
# Built in a single constructor call: DataFrame.append was removed in
# pandas 2.0 and re-copied the whole frame on every iteration. Counts also
# stay integers instead of being upcast to float.
null_mask = df.isna()
ndf = pd.DataFrame(
    {
        "col_name": list(df.columns),
        "total_rows": len(df),
        "null_rows": null_mask.sum().to_numpy(),
        # mean of the boolean mask == null_rows / total_rows (NaN for an empty frame)
        "rate": null_mask.mean().to_numpy(),
    }
)
ndf


# All exported images in this notebook go to stock_analysis/. Create the folder
# first: write_image is not expected to create missing parent directories, so
# a fresh checkout would otherwise fail on the first export.
os.makedirs("stock_analysis", exist_ok=True)

# Histogram of every column, one subplot per column.
fig = df.iplot(kind="hist", subplots=True, title="Distribution of All Variables", asFigure=True)
fig.write_image("stock_analysis/dist.png")
fig.show()


# Box plot of every column, one subplot per column; exported, then displayed.
fig = df.iplot(
    kind="box",
    subplots=True,
    title="Box of All Variables",
    asFigure=True,
)
fig.write_image("stock_analysis/box.png")
fig.show()


# Summary statistics of every column (displayed as the cell result).
df.describe()


# Line chart of every column over the index, one subplot per column.
fig = df.iplot(
    kind="line",
    subplots=True,
    title="Trend of All Variables",
    asFigure=True,
)
fig.write_image("stock_analysis/trend.png")
fig.show()


# Work on a copy so the downloaded frame stays untouched, then take the
# 5-row simple moving average of every column.
tdf = df.copy()
smadf = tdf.rolling(5).mean()
smadf


# Attach each averaged column to the working frame under an "sma_" prefix.
for name, averaged in smadf.items():
    tdf[f"sma_{name}"] = averaged
tdf


# Split the working frame's columns into the SMA columns and everything else;
# both lists keep column order, so zipping them pairs each raw column with
# its own average.
smac = [name for name in tdf.columns if "sma" in name]
col = [name for name in tdf.columns if name not in smac]

for c, s in zip(col, smac):
    pair = tdf[[c, s]]
    fig = pair.iplot(kind="line", title=f"{s} vs {c}", xTitle="Date", asFigure=True)
    fig.write_image(f"stock_analysis/sma_{c}.png")
    fig.show()


# 5-row weighted moving average: the newest row in each window gets weight 5,
# the oldest weight 1 (np.average normalises by the weight sum).
# The weights are built once instead of per window, and raw=True hands each
# window to the lambda as a plain ndarray, avoiding a Series per window.
wma_weights = np.arange(1, 6)
wmadf = df.rolling(window=5).apply(
    lambda window: np.average(window, weights=wma_weights),
    raw=True,
)
wmadf


# Attach each weighted-average column to the working frame as "wma_<column>".
for name, weighted in wmadf.items():
    tdf[f"wma_{name}"] = weighted
tdf


# Group the working frame's columns by kind; each list keeps column order, so
# zipping lines up raw / SMA / WMA versions of the same variable.
smac = [name for name in tdf.columns if "sma" in name]
wmac = [name for name in tdf.columns if "wma" in name]
col = [name for name in tdf.columns if not ("sma" in name or "wma" in name)]

for s, c, w in zip(smac, col, wmac):
    trio = tdf[[c, s, w]]
    fig = trio.iplot(kind="line", title=f"{s} vs {c} vs {w}", xTitle="Date", asFigure=True)
    fig.write_image(f"stock_analysis/wma_{c}.png")
    fig.show()


# Same comparison restricted to the final 100 rows so the curves are
# distinguishable; the slice does not change inside the loop, so take it once.
last_100 = tdf.tail(100)
for s, c, w in zip(smac, col, wmac):
    fig = last_100[[c, s, w]].iplot(kind="line", title=f"{s} vs {c} vs {w}", xTitle="Date", asFigure=True)
    fig.write_image(f"stock_analysis/sma_{c}2.png")
    fig.show()


# Exponentially weighted mean with span 5; the first four rows stay NaN
# because min_periods=5.
ewm_window = df.ewm(span=5, min_periods=5, adjust=True)
emadf = ewm_window.mean()
emadf


# Attach each exponentially weighted column as "ema_<column>".
for name, smoothed in emadf.items():
    tdf[f"ema_{name}"] = smoothed
tdf


# Group columns by moving-average kind; whatever carries none of the three
# tags is a raw column. Order is preserved, so zip pairs matching variables.
smac = [name for name in tdf.columns if "sma" in name]
wmac = [name for name in tdf.columns if "wma" in name]
emac = [name for name in tdf.columns if "ema" in name]
col = [name for name in tdf.columns
       if not any(tag in name for tag in ("sma", "wma", "ema"))]

# Plot only the final 100 rows; the slice is loop-invariant.
last_100 = tdf.tail(100)
for s, c, w, e in zip(smac, col, wmac, emac):
    fig = last_100[[c, s, w, e]].iplot(kind="line", title=f"{s} vs {c} vs {w} vs {e}", xTitle="Date", asFigure=True)
    fig.write_image(f"stock_analysis/ema_{c}.png")
    fig.show()


import plotly.graph_objects as go

# Candlestick chart overlaying the raw OHLC data with its EMA counterpart for
# the final 1000 rows of the working frame.
fig = go.Figure()

recent = tdf[-1000:]

fig.add_trace(
    go.Candlestick(
        x=recent.index,
        open=recent['open'],
        high=recent['high'],
        low=recent['low'],
        close=recent['close'],
        name='Stock Market Data',
    )
)
fig.add_trace(
    go.Candlestick(
        x=recent.index,
        open=recent['ema_open'],
        high=recent['ema_high'],
        low=recent['ema_low'],
        close=recent['ema_close'],
        name='EMA Stock Market Data',
    )
)

fig.update_layout(
    title="AAPL Stock Data",
    yaxis_title="Stock's Price in USD",
    xaxis_title="Date",
)

# Range slider plus quick-zoom buttons on the x axis.
range_buttons = [
    dict(count=150, label="150D", step="day", stepmode="backward"),
    dict(count=4, label="4m", step="month", stepmode="backward"),
    dict(step="all"),
]
fig.update_xaxes(
    rangeslider_visible=True,
    rangeselector=dict(buttons=range_buttons),
)

color_hi_fill = 'black'
color_hi_line = 'blue'

color_lo_fill = 'yellow'
color_lo_line = 'purple'

# Fully transparent colour used to hide one direction of each trace.
transparent = 'rgba(0,0,0,0)'

raw_trace, ema_trace = fig.data

# Raw data: only increasing candles are drawn.
raw_trace.increasing.fillcolor = color_hi_fill
raw_trace.increasing.line.color = color_hi_line
raw_trace.decreasing.fillcolor = transparent
raw_trace.decreasing.line.color = transparent

# EMA data: only decreasing candles are drawn.
ema_trace.increasing.fillcolor = transparent
ema_trace.increasing.line.color = transparent
ema_trace.decreasing.fillcolor = color_lo_fill
ema_trace.decreasing.line.color = color_lo_line

fig.write_image("stock_analysis/candle.png")

fig.show()


# Start again from the raw data and compare a 5-row rolling median with the
# span-5 exponentially weighted mean.
tdf = df.copy()
smmdf = tdf.rolling(5).median()

for name, median in smmdf.items():
    tdf[f"smm_{name}"] = median

emadf = df.ewm(span=5, min_periods=5, adjust=True).mean()

for name, smoothed in emadf.items():
    tdf[f"ema_{name}"] = smoothed

# Column groups keep their order, so zip pairs matching variables.
smmc = [name for name in tdf.columns if "smm" in name]
emac = [name for name in tdf.columns if "ema" in name]
col = [name for name in tdf.columns if not ("smm" in name or "ema" in name)]

# Only the final 100 rows are plotted; the slice is loop-invariant.
last_100 = tdf.tail(100)
for s, c, e in zip(smmc, col, emac):
    fig = last_100[[c, s, e]].iplot(kind="line", title=f"{s} vs {c} vs {e}", xTitle="Date", asFigure=True)
    fig.write_image(f"stock_analysis/mma_{c}.png")
    fig.show()


# Moving variance: compare the 5-row rolling variance with the span-5
# exponentially weighted variance of every column.
tdf = df.copy()
# NOTE: the smm*/ema* names are kept from the median cell, but here they hold
# variances (columns are prefixed "smv_" / "emv_").
smmdf = tdf.rolling(window=5).var()

for c in smmdf.columns:
    tdf[f"smv_{c}"] = smmdf[c]

emadf = df.ewm(span=5, min_periods=5, adjust=True).var()

for c in emadf.columns:
    tdf[f"emv_{c}"] = emadf[c]

# Column groups keep their order, so zip pairs matching variables.
smmc = [c for c in tdf.columns if "smv" in c]
emac = [c for c in tdf.columns if "emv" in c]
col = [c for c in tdf.columns if "smv" not in c and "emv" not in c]

for s, c, e in zip(smmc, col, emac):
    # Keep the returned figure: previously the result was discarded, so the
    # stale figure from the preceding cell was exported and shown each time.
    # The raw column goes on the secondary axis because its scale differs
    # from that of the variances.
    fig = tdf[-100:][[c, s, e]].iplot(kind="line", y=[s, e], secondary_y=c, title=f"{s} vs {c} vs {e}", xTitle="Date", asFigure=True)
    # One file per variable; the old fixed name overwrote the trend chart
    # exported earlier in the notebook.
    fig.write_image(f"stock_analysis/mv_{c}.png")
    fig.show()

	Open	High	Low	Close	Adj Close	Volume
Date
1980-12-12	0.128348	0.128906	0.128348	0.128348	0.100326	469033600
1980-12-15	0.122210	0.122210	0.121652	0.121652	0.095092	175884800
1980-12-16	0.113281	0.113281	0.112723	0.112723	0.088112	105728000
1980-12-17	0.115513	0.116071	0.115513	0.115513	0.090293	86441600
1980-12-18	0.118862	0.119420	0.118862	0.118862	0.092911	73449600

	open	high	low	close	adj_close	volume
count	10390.000000	10390.000000	10390.000000	10390.000000	10390.000000	1.039000e+04
mean	13.689530	13.837209	13.542035	13.695320	13.077773	3.326112e+08
std	29.525352	29.857351	29.199483	29.542847	29.249790	3.394925e+08
min	0.049665	0.049665	0.049107	0.049107	0.038385	0.000000e+00
25%	0.281250	0.287946	0.273996	0.281250	0.234167	1.251712e+08
50%	0.466518	0.476004	0.459732	0.466518	0.385693	2.205952e+08
75%	14.034375	14.205357	13.918214	14.033482	12.025375	4.136293e+08
max	182.630005	182.940002	179.119995	182.009995	181.778397	7.421641e+09

	open	high	low	close	adj_close	volume
Date
1980-12-12	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-15	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-16	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-17	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-18	0.119643	0.119978	0.119420	0.119420	0.093347	182107520.0
...	...	...	...	...	...	...
2022-02-18	170.208002	171.663998	168.304001	170.080002	170.080002	72770540.0
2022-02-22	169.730002	171.085999	167.422000	169.168002	169.168002	73766000.0
2022-02-23	168.644000	169.725998	165.322000	166.624005	166.624005	78910580.0
2022-02-24	164.789999	167.628000	161.712000	164.662006	164.662006	94904600.0
2022-02-25	163.351999	166.269998	160.191998	163.856006	163.856006	99363080.0

	open	high	low	close	adj_close	volume	sma_open	sma_high	sma_low	sma_close	sma_adj_close	sma_volume
Date
1980-12-12	0.128348	0.128906	0.128348	0.128348	0.100326	469033600	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-15	0.122210	0.122210	0.121652	0.121652	0.095092	175884800	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-16	0.113281	0.113281	0.112723	0.112723	0.088112	105728000	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-17	0.115513	0.116071	0.115513	0.115513	0.090293	86441600	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-18	0.118862	0.119420	0.118862	0.118862	0.092911	73449600	0.119643	0.119978	0.119420	0.119420	0.093347	182107520.0
...	...	...	...	...	...	...	...	...	...	...	...	...
2022-02-18	169.820007	170.539993	166.190002	167.300003	167.300003	82614200	170.208002	171.663998	168.304001	170.080002	170.080002	72770540.0
2022-02-22	164.979996	166.690002	162.149994	164.320007	164.320007	91162800	169.730002	171.085999	167.422000	169.168002	169.168002	73766000.0
2022-02-23	165.539993	166.149994	159.750000	160.070007	160.070007	90009200	168.644000	169.725998	165.322000	166.624005	166.624005	78910580.0
2022-02-24	152.580002	162.850006	152.000000	162.740005	162.740005	141147500	164.789999	167.628000	161.712000	164.662006	164.662006	94904600.0
2022-02-25	163.839996	165.119995	160.869995	164.850006	164.850006	91881700	163.351999	166.269998	160.191998	163.856006	163.856006	99363080.0

	open	high	low	close	adj_close	volume
Date
1980-12-12	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-15	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-16	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-17	NaN	NaN	NaN	NaN	NaN	NaN
1980-12-18	0.117932	0.118304	0.117746	0.117746	0.092038	1.234001e+08
...	...	...	...	...	...	...
2022-02-18	170.538670	171.722664	168.136002	169.608669	169.608669	7.264790e+07
2022-02-22	168.796001	170.064666	166.084666	167.688671	167.688671	7.877865e+07
2022-02-23	167.399332	168.419331	163.527333	164.656006	164.656006	8.419305e+07
2022-02-24	162.044666	166.127334	159.086666	163.361339	163.361339	1.049387e+08
2022-02-25	161.727998	165.291332	158.805998	163.424006	163.424006	1.039311e+08

Table of Contents

Introduction¶

Preliminary Actions¶

Install Libraries¶

Import Required Libraries¶

Download Stock Data of Apple¶

Perform EDA¶

Checking for Null Value¶

View the Distribution¶

View the Box Plot¶

Summary of our data¶

Moving Average¶

Simple Moving Average (SMA)¶

Plotting SMA of All¶

Weighted Moving Average (WMA)¶

Plotting WMA of All¶

Exponential Moving Average (EMA)¶

Plotting EMA of All¶

Plotting Candlestick¶

Moving Median¶

Moving Variance¶

Conclusion¶

	col_name	total_rows
0	open	10390.0
1	high	10390.0
2	low	10390.0
3	close	10390.0
4	adj_close	10390.0
5	volume	10390.0