#import packages
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
# Load the project workbook into a DataFrame. The path is kept in a named
# constant so it can be changed in one place.
DATA_PATH = '/home/jovyan/work/the data for your group project_MA541.xlsx'
df = pd.read_excel(DATA_PATH)

# Preview the first rows. A bare `df.head()` is only rendered when it is the
# last expression of a notebook cell; printing makes the preview visible when
# this file is run as a plain script as well.
print(df.head())
# Print the mean followed by the standard deviation of each analysed column,
# in the order Close_ETF, oil, gold, JPM (two lines of output per column).
for column in ('Close_ETF', 'oil', 'gold', 'JPM'):
    series = df[column]
    print(series.mean())
    print(series.std())
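# Recorded output of the mean / standard-deviation prints above:
# 121.152960012             (Close_ETF mean)
# 12.569790313110744        (Close_ETF std)
# 0.0010300354937470017     (oil mean)
# 0.021092898551005313      (oil std)
# 0.0006628360819999999     (gold mean)
# 0.011289060259316142      (gold std)
# 0.0005304110210000001     (JPM mean)
# 0.011016562382593569      (JPM std)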
# Pairwise correlation matrix of the DataFrame's columns. Printed explicitly
# because a bare `df.corr()` expression is discarded unless it is the last
# statement of a notebook cell.
print(df.corr())

# Histograms of the four columns, one subplot each. Plotting them one after
# another without creating new axes draws every histogram onto the same axes,
# which is unreadable because Close_ETF is on a very different scale from the
# other three series.
hist_columns = ['Close_ETF', 'oil', 'gold', 'JPM']
fig, axes = plt.subplots(2, 2, figsize=(10, 8))
for ax, column in zip(axes.ravel(), hist_columns):
    df[column].plot(kind='hist', ax=ax, title=column)
fig.tight_layout()
# Needed to display the figure when run outside an inline-plotting notebook.
plt.show()