import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
data = pd.read_csv(r'D:\Anaconda Files\Earthquakes\Earthquakes.csv', decimal=',' ,sep='\t', encoding='utf-8')
data['Date'] = pd.to_datetime(data['Date'])
data['Magnitude'] = data['Magnitude'].astype(float)
#sns.set_theme(style="whitegrid")
#tips = sns.load_dataset("tips")
plt.figure(figsize=(20,6))
ax = sns.boxplot(x=data["Magnitude"])
#Plot Histogram of "size"
plt.figure(figsize=(20,6))
sns.distplot(data["Magnitude"], bins = 40)
#Plot Histogram of "size"
datax = data[data['Magnitude'] >= 7]
plt.figure(figsize=(20,6))
sns.distplot(datax["Magnitude"], bins = 26)
#Count
rank_pre = data.groupby(['Country'])['Country'].count()
rank_pre = pd.DataFrame(rank_pre, columns=['Country', 'Length'])
rank_pre = rank_pre.drop(rank_pre.columns[1],axis=1)
rank_pre.index.names = ['Country_Name']
rank_pre.rename(columns = {'Country':'Count >5'}, inplace = True)
rank_pre.sort_values(by=['Count >5'], inplace=True, ascending=False)
rank_pre.head(15)
data_pre = data[data['Magnitude'] >= 6]
rank_pre = data_pre.groupby(['Country'])['Country'].count()
rank_pre = pd.DataFrame(rank_pre, columns=['Country', 'Length'])
rank_pre = rank_pre.drop(rank_pre.columns[1],axis=1)
rank_pre.index.names = ['Country_Name']
rank_pre.rename(columns = {'Country':'Count >6'}, inplace = True)
rank_pre.sort_values(by=['Count >6'], inplace=True, ascending=False)
rank_pre.head(15)
data_pre = data[data['Magnitude'] >= 7]
rank_pre = data_pre.groupby(['Country'])['Country'].count()
rank_pre = pd.DataFrame(rank_pre, columns=['Country', 'Length'])
rank_pre = rank_pre.drop(rank_pre.columns[1],axis=1)
rank_pre.index.names = ['Country_Name']
rank_pre.rename(columns = {'Country':'Count >7'}, inplace = True)
rank_pre.sort_values(by=['Count >7'], inplace=True, ascending=False)
rank_pre.head(15)
#Count
rank_pre = data.groupby(['Magnitude'])['Magnitude'].count()
rank_pre.head(20)