# Data and array manipulation
import pandas as pd
import numpy as np

# Datetime manipulation
import datetime as dt

# Plotting and Visualization
import matplotlib.pyplot as plt
import plotly.express as px
import chart_studio.plotly as py
import cufflinks as cf


# Fetching stock data from web
import pandas_datareader.data as web

# Interactive charts
# Side-effect setup executed once at import time so figures render inside the notebook.
from plotly.offline import download_plotlyjs, init_notebook_mode, plot, iplot
# NOTE(review): per the Plotly docs, connected=True loads plotly.js from a CDN
# instead of embedding it in the notebook — confirm network access is acceptable.
init_notebook_mode(connected = True)
# Switches cufflinks to its offline mode (no Chart Studio account needed) — presumably
# required for any DataFrame.iplot usage; none is visible in this file.
cf.go_offline()

# Display option: show floats with thousands separators and four decimals
pd.options.display.float_format = '{:,.4f}'.format

# Shared y-axis styling passed to the charts in this file
default_yaxis = {
    'showgrid': False,
    'zeroline': False,
    'showline': False,
    'showticklabels': True,
}

# Shared range-selector buttons attached to the x-axis of the time-series charts
default_RgSlct = {
    'buttons': [
        {'count': 1, 'label': "1 Month", 'step': "month", 'stepmode': "backward"},
        {'count': 6, 'label': "6 Months", 'step': "month", 'stepmode': "backward"},
        {'count': 1, 'label': "1 Year", 'step': "year", 'stepmode': "backward"},
        {'count': 1, 'label': "YTD", 'step': "year", 'stepmode': "todate"},
        {'label': "All Data", 'step': "all"},
    ],
}


# Five-year window of data to be fetched (both bounds are passed to the reader)
start = dt.datetime(year = 2017, month = 6, day = 28)
end = dt.datetime(year = 2022, month = 6, day = 28)

# Tickers of the chosen stocks
tickers = [
    'SY1.DE',
    'ALV.DE',
    'MRK.DE',
    'DTE.DE',
    'VOW3.DE',
    'DBK.DE',
    'HNR1.DE',
    'HEI.DE',
    '1COV.DE',
    'BEI.DE',
]

# Fetch the price history of every ticker and stack the results into one long
# DataFrame with a `Ticker` column identifying the source of each row.
# NOTE(review): the 'yahoo' source depends on the installed pandas-datareader
# still being able to reach Yahoo's endpoint — confirm before re-running.
frames = []
for ticker in tickers:
    # reset_index() turns the reader's index into a regular column
    history = web.DataReader(ticker, 'yahoo', start, end).reset_index()
    history['Ticker'] = ticker
    frames.append(history)

# Concatenate once at the end: growing a DataFrame inside the loop re-copies all
# previously fetched rows on every iteration and mixes in an empty seed frame.
df = pd.concat(frames, ignore_index = True) if frames else pd.DataFrame()

# combined Data Frame
df


# Number of missing entries in each column of the combined frame
missing_mask = df.isnull()
missing_mask.sum()

Date         0
High         0
Low          0
Open         0
Close        0
Volume       0
Adj Close    0
Ticker       0
dtype: int64


# First date, last date, and number of observations for each ticker
dates_by_ticker = df.groupby('Ticker')['Date']
dates_by_ticker.agg(['min', 'max', 'count'])


# Individual changes of each stock: one area-chart facet per ticker, two per row
fig = px.area(df,
              x = 'Date',
              y = 'Open',
              facet_col = 'Ticker',
              color = 'Ticker',
              facet_col_wrap = 2,
              # `labels` is keyed by column name; the former 'x'/'y' keys matched
              # no column and were ignored, leaving the y-axis titled "Open"
              labels = {'Date': 'Date', 'Open': 'Price'},
              title = 'Opening Price of chosen stocks in EUR (Jul 2017 - Jun 2022)',
              width = 1000,
              height = 800)

# Adjusting the layout to reduce clutter (legend is redundant with facet titles)
# NOTE(review): `yaxis` addresses only the first y-axis of the facet grid; use
# fig.update_yaxes(...) if the styling is meant for every facet.
fig.update_layout(yaxis = default_yaxis, showlegend = False, autosize = True, plot_bgcolor = 'white')

# Showing the visualization
fig.show()


# Opening price of all tickers on one line chart, one coloured trace per ticker
fig = px.line(df,
              x = 'Date',
              y = 'Open',
              color = 'Ticker',
              # `labels` is keyed by column name; the former 'x'/'y' keys matched
              # no column and were ignored, leaving the y-axis titled "Open"
              labels = {'Date': 'Date', 'Open': 'Price'},
              title = 'Opening Price of chosen stocks in EUR (Jul 2017 - Jun 2022)',
              width = 1000,
              height = 600)

# Updating layout to reduce clutter
fig.update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')

# Adding the range-selector buttons (1 Month ... All Data) to the x-axis
fig.update_xaxes(rangeselector = default_RgSlct)

# Showing the visualization
fig.show()


# Traded volume of all tickers on one line chart, one coloured trace per ticker
fig = px.line(df,
              x = 'Date',
              y = 'Volume',
              color = 'Ticker',
              # `labels` is keyed by column name; the former 'x'/'y' keys matched
              # no column and were ignored, leaving the y-axis titled "Volume"
              labels = {'Date': 'Date', 'Volume': 'Traded Volume'},
              title = 'Traded Volume of chosen stocks (Jul 2017 - Jun 2022)',
              width = 1000,
              height = 600)

# Updating layout to reduce clutter
fig.update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')

# Adding the range-selector buttons (1 Month ... All Data) to the x-axis
fig.update_xaxes(rangeselector = default_RgSlct)

# Showing the visualization
fig.show()


# Traded value is approximated as the day's mid price (average of High and Low)
# multiplied by the traded volume
mid_price = (df['High'] + df['Low']) / 2
df['Traded Value'] = mid_price * df['Volume']

# Line chart of traded value per ticker, styled and given range-selector
# buttons in a single chained expression
fig = (
    px.line(
        df,
        x = 'Date',
        y = 'Traded Value',
        color = 'Ticker',
        title = 'Traded value of chosen stocks in EUR (Jul 2017 - Jun 2022)',
        width = 1000,
        height = 600,
    )
    .update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')
    .update_xaxes(rangeselector = default_RgSlct)
)

# Render the figure
fig.show()


# Variables to summarise per ticker
stat_vars = ['Open', 'Volume', 'Traded Value']

# (variable, statistic) columns to show: the observation count once, then
# mean, std and their ratio for every variable
r_show = [('Open', 'count')] + [(var, stat)
                                for var in stat_vars
                                for stat in ('mean', 'std', 'mean/std')]

# Per-ticker descriptive statistics of the chosen variables
tab_sum1 = df[stat_vars + ['Ticker']].groupby('Ticker').describe()

# Adding the `mean/std` ratio next to each variable's statistics
for var in stat_vars:
    tab_sum1[(var, 'mean/std')] = tab_sum1[(var, 'mean')] / tab_sum1[(var, 'std')]

# Keep only the listed columns, then display sorted by mean traded value (largest first)
tab_sum1 = tab_sum1.loc[:, r_show]
tab_sum1.sort_values(by = [('Traded Value', 'mean')], ascending = False)


# Extracting data of `DTE.DE`
# .copy() gives an independent frame: adding columns to a boolean-filtered slice
# of `df` triggers pandas' SettingWithCopyWarning and is not guaranteed to stick.
df_smooth = df[df.Ticker == 'DTE.DE'].copy()

# Calculating moving averages of the opening price; the first (window - 1) rows
# of each column are NaN because the rolling window is not yet full
for window in (30, 50, 100):
    df_smooth[f'MA{window}'] = df_smooth['Open'].rolling(window).mean()

# Line chart of the raw opening price together with its moving averages
fig = px.line(df_smooth,
              x = 'Date',
              y = ['Open', 'MA30', 'MA50', 'MA100'],
              title = 'Smoothed opening price of DTE.DE (Jul 2017 - Jun 2022)',
              width = 1000,
              height = 600)

# Updating layout to reduce clutter
fig.update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')

# Adding the range-selector buttons (1 Month ... All Data) to the x-axis
fig.update_xaxes(rangeselector = default_RgSlct)

# Showing the visualization
fig.show()


# Columns needed to build the returns table
c_show = ['Date', 'Adj Close', 'Ticker']

# Long -> wide: one row per date, one column of adjusted closing prices per ticker
df_closingP = df[c_show].pivot(index = 'Date', columns = 'Ticker', values = 'Adj Close')

# Day-over-day percentage change; the first row is NaN (no previous day)
df_returns = df_closingP.pct_change()

# Display the returns table
df_returns


# Descriptive statistics of daily returns, one row per ticker,
# ordered from the largest to the smallest standard deviation
return_stats = df_returns.describe().T
tab_sum2 = return_stats.sort_values(by = 'std', ascending = False)
tab_sum2


# Ratio of mean daily return to its standard deviation, displayed in ascending order
mean_to_std = tab_sum2['mean'] / tab_sum2['std']
tab_sum2['S'] = mean_to_std
tab_sum2.sort_values(by = 'S')


# Daily percentage returns of every ticker over time, styled and given
# range-selector buttons in a single chained expression
fig = (
    px.line(
        df_returns,
        x = df_returns.index,
        y = df_returns.columns,
        title = 'Changes in daily percentage returns of chosen stocks (Jul 2017 - Jun 2022)',
        width = 1000,
        height = 600,
    )
    .update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')
    .update_xaxes(rangeselector = default_RgSlct)
)

# Render the figure
fig.show()


# One box per ticker showing the distribution of its daily returns,
# with the shared decluttered layout applied in the same expression
fig = px.box(
    df_returns,
    title = 'Box plots of daily percentage returns of chosen stocks (Jul 2017 - Jun 2022)',
    width = 1000,
    height = 600,
).update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')

# Render the figure
fig.show()


# Pairwise correlation of daily returns between tickers
corr_matrix = df_returns.corr()

# Heat map of the correlation matrix with each cell annotated to three decimals
fig = px.imshow(
    corr_matrix,
    labels = dict(color = 'Correlation'),
    width = 800,
    height = 800,
    text_auto = '.3f',
)

# Move the x-axis (ticker labels) to the top of the heat map
fig.update_xaxes(side = 'top')

# Render the figure
fig.show()


# Pairwise scatter plots of daily returns for every combination of tickers;
# semi-transparent markers keep dense regions readable
# NOTE(review): `yaxis` addresses only the first y-axis of the matrix; use
# fig.update_yaxes(...) if the styling is meant for every panel.
fig = px.scatter_matrix(
    df_returns,
    opacity = 0.4,
    width = 800,
    height = 800,
).update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')

# Render the figure
fig.show()


# Cumulative return: running product of the daily growth factors (1 + return)
growth_factors = 1 + df_returns
df_cumR = growth_factors.cumprod()
df_cumR


# Cumulative returns of every ticker over time. The dashed line at y = 1 marks
# the break-even level; layout, reference line and range-selector buttons are
# applied in a single chained expression
fig = (
    px.line(
        df_cumR,
        x = df_cumR.index,
        y = df_cumR.columns,
        title = 'Changes in cumulative returns of chosen stocks (Jul 2017 - Jun 2022)',
        width = 1000,
        height = 600,
    )
    .update_layout(yaxis = default_yaxis, autosize = True, plot_bgcolor = 'white')
    .add_hline(y = 1, line_dash = "dash", opacity = 0.5, annotation_text = "Break Even", annotation_position = "bottom right")
    .update_xaxes(rangeselector = default_RgSlct)
)

# Render the figure
fig.show()

Symbol	Company Name	Last Price	Change	% Change	Volume
SY1.DE	Symrise AG	106.25	0.05	0.05%	277,156
ALV.DE	Allianz SE	181.04	-0.16	-0.09%	1,069,053
MRK.DE	MERCK Kommanditgesellschaft auf Aktien	165.1	0.3	0.18%	313,644
DTE.DE	Deutsche Telekom AG	18.84	-0.04	-0.20%	6,880,550
VOW3.DE	Volkswagen AG	138.88	-0.3	-0.22%	913,070
DBK.DE	Deutsche Bank Aktiengesellschaft	8.89	-0.03	-0.33%	10,112,593
HNR1.DE	Hannover Rück SE	136.4	-0.45	-0.33%	95,892
HEI.DE	HeidelbergCement AG	48.78	0.29	0.60%	623,977
1COV.DE	Covestro AG	34.26	-0.22	-0.64%	982,911
BEI.DE	Beiersdorf Aktiengesellschaft	98.62	0.64	0.65%	246,097

	Date	High	Low	Open	Close	Volume	Adj Close	Ticker
0	2017-06-28	63.5700	62.6600	63.0900	62.7300	282,906.0000	59.0006	SY1.DE
1	2017-06-29	63.4300	62.0100	63.1400	62.2600	285,637.0000	58.5585	SY1.DE
2	2017-06-30	63.1100	62.0200	62.2600	62.0200	332,730.0000	58.3328	SY1.DE
3	2017-07-03	62.9000	62.1400	62.4000	62.4800	185,066.0000	58.7654	SY1.DE
4	2017-07-04	62.4500	61.7400	62.4200	62.0500	191,373.0000	58.3610	SY1.DE
...	...	...	...	...	...	...	...	...
12675	2022-06-22	95.6600	93.0600	93.7600	95.2600	419,458.0000	95.2600	BEI.DE
12676	2022-06-23	97.0600	95.0000	95.3000	96.6800	502,331.0000	96.6800	BEI.DE
12677	2022-06-24	98.7200	96.7600	97.4800	97.9800	326,421.0000	97.9800	BEI.DE
12678	2022-06-27	99.2600	98.1600	98.7400	98.6200	246,097.0000	98.6200	BEI.DE
12679	2022-06-28	99.0000	97.4200	98.4600	97.8600	334,672.0000	97.8600	BEI.DE

	min	max	count
Ticker
1COV.DE	2017-06-28	2022-06-28	1268
ALV.DE	2017-06-28	2022-06-28	1268
BEI.DE	2017-06-28	2022-06-28	1268
DBK.DE	2017-06-28	2022-06-28	1268
DTE.DE	2017-06-28	2022-06-28	1268
HEI.DE	2017-06-28	2022-06-28	1268
HNR1.DE	2017-06-28	2022-06-28	1268
MRK.DE	2017-06-28	2022-06-28	1268
SY1.DE	2017-06-28	2022-06-28	1268
VOW3.DE	2017-06-28	2022-06-28	1268

	Open				Volume			Traded Value
	count	mean	std	mean/std	mean	std	mean/std	mean	std	mean/std
Ticker
ALV.DE	1,268.0000	195.9094	17.1550	11.4200	1,234,959.0726	702,663.7348	1.7575	236,806,477.0144	120,640,343.5833	1.9629
VOW3.DE	1,268.0000	160.5898	26.3272	6.0998	1,246,523.7240	599,780.2028	2.0783	197,841,817.5991	99,784,517.4007	1.9827
DTE.DE	1,268.0000	15.2874	1.3982	10.9336	11,036,654.7626	5,414,675.0686	2.0383	165,840,174.8011	75,651,554.0899	2.1922
DBK.DE	1,268.0000	9.9029	2.7057	3.6600	14,553,537.1491	8,131,983.2105	1.7897	140,744,673.5562	82,965,723.6908	1.6964
1COV.DE	1,268.0000	54.7616	15.9841	3.4260	1,145,047.6601	680,003.6839	1.6839	58,916,163.4940	35,387,583.9680	1.6649
MRK.DE	1,268.0000	121.6767	39.1691	3.1064	483,637.3778	246,255.1722	1.9640	55,105,627.2274	25,301,075.3868	2.1780
HEI.DE	1,268.0000	66.4163	12.3248	5.3888	773,029.8604	395,742.2731	1.9534	49,452,505.0395	21,673,552.6223	2.2817
BEI.DE	1,268.0000	96.2652	6.2116	15.4976	394,496.2429	235,102.5830	1.6780	37,681,767.0158	21,338,037.4809	1.7659
SY1.DE	1,268.0000	91.1997	19.3209	4.7203	282,146.9606	146,474.4901	1.9263	25,581,089.6025	14,734,240.0513	1.7362
HNR1.DE	1,268.0000	136.8233	20.9603	6.5277	152,241.8675	89,515.4769	1.7007	20,469,877.0361	12,171,915.3281	1.6817

Ticker	1COV.DE	ALV.DE	BEI.DE	DBK.DE	DTE.DE	HEI.DE	HNR1.DE	MRK.DE	SY1.DE	VOW3.DE
Date
2017-06-28	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
2017-06-29	-0.0483	-0.0072	-0.0322	0.0054	-0.0209	-0.0030	-0.0005	-0.0217	-0.0075	-0.0100
2017-06-30	-0.0035	-0.0040	0.0002	-0.0190	-0.0116	-0.0053	-0.0005	-0.0005	-0.0039	0.0026
2017-07-03	0.0079	0.0203	-0.0027	0.0367	0.0067	0.0250	0.0114	-0.0071	0.0074	0.0184
2017-07-04	-0.0138	0.0043	-0.0038	0.0186	-0.0095	0.0040	0.0047	-0.0090	-0.0069	0.0029
...	...	...	...	...	...	...	...	...	...	...
2022-06-22	-0.0548	-0.0070	0.0125	-0.0015	0.0171	-0.0091	-0.0145	-0.0095	0.0104	-0.0142
2022-06-23	-0.0302	-0.0263	0.0149	-0.1219	-0.0004	-0.0306	-0.0331	-0.0067	0.0005	-0.0370
2022-06-24	0.0414	0.0123	0.0134	0.0478	0.0119	0.0193	0.0419	0.0557	0.0422	0.0009
2022-06-27	-0.0064	-0.0009	0.0065	-0.0033	-0.0020	0.0060	-0.0033	0.0018	0.0005	-0.0022
2022-06-28	0.0035	0.0114	-0.0077	-0.0030	0.0120	-0.0016	0.0081	-0.0085	-0.0122	0.0140

Python Project 1: Stock Data Analysis with Pandas and Plotly

Case description

Objectives

Details of the analysis

Important libraries and default settings

Reading data

Trend Analysis

Volatility analysis

Cumulative returns

Conclusion

	count	mean	std	min	25%	50%	75%	max
Ticker
DBK.DE	1,267.0000	-0.0001	0.0260	-0.1844	-0.0125	-0.0002	0.0136	0.1290
VOW3.DE	1,267.0000	0.0004	0.0226	-0.1521	-0.0107	-0.0001	0.0104	0.1905
1COV.DE	1,267.0000	-0.0001	0.0214	-0.1556	-0.0114	0.0002	0.0118	0.0887
HEI.DE	1,267.0000	-0.0001	0.0193	-0.1424	-0.0088	0.0000	0.0087	0.1146
HNR1.DE	1,267.0000	0.0004	0.0165	-0.1779	-0.0062	0.0007	0.0079	0.1707
ALV.DE	1,267.0000	0.0004	0.0161	-0.1533	-0.0062	0.0005	0.0070	0.1580
MRK.DE	1,267.0000	0.0005	0.0157	-0.0922	-0.0073	0.0005	0.0090	0.1012
SY1.DE	1,267.0000	0.0006	0.0142	-0.1001	-0.0064	0.0005	0.0082	0.1034
BEI.DE	1,267.0000	0.0001	0.0131	-0.0981	-0.0058	0.0000	0.0068	0.0756
DTE.DE	1,267.0000	0.0004	0.0127	-0.1066	-0.0056	0.0000	0.0069	0.0652

Ticker	1COV.DE	ALV.DE	BEI.DE	DBK.DE	DTE.DE	HEI.DE	HNR1.DE	MRK.DE	SY1.DE	VOW3.DE
Date
2017-06-28	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN	NaN
2017-06-29	0.9517	0.9928	0.9678	1.0054	0.9791	0.9970	0.9995	0.9783	0.9925	0.9900
2017-06-30	0.9484	0.9888	0.9680	0.9863	0.9677	0.9917	0.9990	0.9778	0.9887	0.9926
2017-07-03	0.9559	1.0089	0.9654	1.0226	0.9741	1.0165	1.0105	0.9709	0.9960	1.0108
2017-07-04	0.9427	1.0132	0.9617	1.0416	0.9649	1.0206	1.0152	0.9621	0.9892	1.0138
...	...	...	...	...	...	...	...	...	...	...
2022-06-22	0.6833	1.3440	1.0405	0.6469	1.4857	0.7155	1.3902	1.5636	1.7263	1.2720
2022-06-23	0.6627	1.3086	1.0560	0.5680	1.4851	0.6936	1.3442	1.5531	1.7271	1.2250
2022-06-24	0.6901	1.3247	1.0702	0.5952	1.5027	0.7070	1.4005	1.6397	1.8000	1.2260
2022-06-27	0.6857	1.3236	1.0772	0.5932	1.4997	0.7113	1.3959	1.6427	1.8008	1.2234
2022-06-28	0.6881	1.3386	1.0689	0.5914	1.5177	0.7101	1.4071	1.6288	1.7788	1.2405