diff --git a/q01_plot/build.py b/q01_plot/build.py
index 0425964..06a3831 100644
--- a/q01_plot/build.py
+++ b/q01_plot/build.py
@@ -1,8 +1,30 @@
+# %load q01_plot/build.py
+# Default imports
 import matplotlib.pyplot as plt
 import seaborn as sns
 import pandas as pd
 
 data = pd.read_csv('data/house_prices_multivariate.csv')
 
-plt.switch_backend('agg')
-# Write your code here :
+# Write your code here:
+def plot(num_cols):
+    """Draw a histogram for every column in ``num_cols``, two per figure.
+
+    ``num_cols`` is a sequence of column names looked up in the module-level
+    ``data`` frame.  Columns are paired in order; a trailing unpaired column
+    gets a figure of its own.  ``plt.show()`` is called once per figure and
+    nothing is returned.
+    """
+    cols = list(num_cols)
+    for start in range(0, len(cols), 2):
+        pair = cols[start:start + 2]
+        # Keep the wide canvas for the two-panel case only.
+        plt.figure(figsize=(10, 4) if len(pair) == 2 else None)
+        for slot, col in enumerate(pair, start=1):
+            plt.subplot(1, len(pair), slot)
+            # NOTE(review): newer seaborn releases deprecate distplot in
+            # favour of histplot -- confirm the pinned version before moving.
+            sns.distplot(data[col], kde=False)
+        # Also runs for an unpaired last column so it is laid out and shown.
+        plt.tight_layout()
+        plt.show()
diff --git a/q02_plot/build.py b/q02_plot/build.py
index 67b4924..720df8b 100644
--- a/q02_plot/build.py
+++ b/q02_plot/build.py
@@ -1,11 +1,34 @@
+# %load q02_plot/build.py
 # Default imports
 import pandas as pd
 import matplotlib.pyplot as plt
 import seaborn as sns
-
-data = pd.read_csv('data/house_prices_multivariate.csv')
 
 plt.switch_backend('agg')
+data = pd.read_csv('data/house_prices_multivariate.csv')
+# Reuse the frame loaded above instead of parsing the CSV a second time.
+dataframe = data.copy()
 
 # Write your code here:
+def plot(a):
+    """Draw box plots of four fixed columns of ``a``, two per figure.
+
+    ``a`` is the data frame handed to seaborn; the columns plotted are
+    LotArea, GarageArea, OpenPorchSF and SalePrice.  ``plt.show()`` is called
+    once per figure and nothing is returned.
+    """
+    num_cols = ['LotArea', 'GarageArea', 'OpenPorchSF', 'SalePrice']
+    for start in range(0, len(num_cols), 2):
+        pair = num_cols[start:start + 2]
+        plt.figure(figsize=(10, 4))
+        for slot, col in enumerate(pair, start=1):
+            plt.subplot(1, 2, slot)
+            # The column goes by keyword: seaborn 0.12+ no longer accepts
+            # x/y positionally.
+            sns.boxplot(y=col, data=a)
+        plt.tight_layout()
+        plt.show()
+
+
+plot(dataframe)
 
diff --git a/q03_regression_plot/build.py b/q03_regression_plot/build.py
index 2aaf8f6..135fb4d 100644
--- a/q03_regression_plot/build.py
+++ b/q03_regression_plot/build.py
@@ -1,3 +1,4 @@
+# %load q03_regression_plot/build.py
 # Default imports
 
 import pandas as pd
@@ -8,8 +9,18 @@
 data = pd.read_csv('data/house_prices_multivariate.csv')
 
 plt.switch_backend('agg')
-
 # Write your code here
+def regression_plot(a, b):
+    """Scatter ``b`` against ``a`` with a fitted regression line.
+
+    ``a`` and ``b`` are column names in the module-level ``data`` frame, used
+    as the x and y variables respectively.  Nothing is returned.
+    """
+    # x/y go by keyword: seaborn 0.12+ no longer accepts them positionally.
+    sns.lmplot(x=a, y=b, data=data, fit_reg=True)
+
+
+regression_plot('GrLivArea', 'SalePrice')
 
 
 
diff --git a/q04_cor/build.py b/q04_cor/build.py
index f3fae50..73def22 100644
--- a/q04_cor/build.py
+++ b/q04_cor/build.py
@@ -1,3 +1,4 @@
+# %load q04_cor/build.py
 # Default imports
 import pandas as pd
 import matplotlib.pyplot as plt
@@ -6,5 +7,14 @@
 data = pd.read_csv('data/house_prices_multivariate.csv')
 
 plt.switch_backend('agg')
-
 # Write your code here
+def cor(a):
+    """Draw a heat map of the pairwise correlations between ``a``'s columns.
+
+    ``a`` is a data frame; its ``corr()`` matrix is passed to seaborn.
+    Nothing is returned.
+    """
+    sns.heatmap(a.corr())
+
+
+cor(data)