diff --git a/q01_plot/build.py b/q01_plot/build.py
index 0425964..51e7ebc 100644
--- a/q01_plot/build.py
+++ b/q01_plot/build.py
@@ -1,8 +1,35 @@
+# %load q01_plot/build.py
+# Default imports
 import matplotlib.pyplot as plt
 import seaborn as sns
 import pandas as pd
 
+plt.switch_backend('agg')
 data = pd.read_csv('data/house_prices_multivariate.csv')
 
-plt.switch_backend('agg')
-# Write your code here :
+num_cols = ['LotArea', 'GarageArea', 'OpenPorchSF', 'SalePrice']
+# Write your code here:
+def plot(num_cols):
+    """Draw histograms of the given columns of ``data``, two per figure.
+
+    Columns are taken in consecutive pairs and each pair shares one
+    10x4 inch figure; when the list has an odd length the last column
+    is drawn alone in the left panel instead of being dropped.
+
+    Parameters
+    ----------
+    num_cols : list of str
+        Column names of the module-level ``data`` frame to plot.
+    """
+    for start in range(0, len(num_cols), 2):
+        plt.figure(figsize=(10, 4))
+        for panel, column in enumerate(num_cols[start:start + 2], start=1):
+            plt.subplot(1, 2, panel)
+            # NOTE: distplot is deprecated in newer seaborn releases; it is
+            # kept so the script still runs on older seaborn versions.
+            sns.distplot(data[column], hist=True, kde=False)
+        plt.tight_layout()
+        plt.show()
+
+plot(num_cols)
+
diff --git a/q02_plot/build.py b/q02_plot/build.py
index 67b4924..2a147d1 100644
--- a/q02_plot/build.py
+++ b/q02_plot/build.py
@@ -1,11 +1,34 @@
+# %load q02_plot/build.py
 # Default imports
 import pandas as pd
 import matplotlib.pyplot as plt
 import seaborn as sns
-
-data = pd.read_csv('data/house_prices_multivariate.csv')
 plt.switch_backend('agg')
+data = pd.read_csv('data/house_prices_multivariate.csv')
+num_cols = ['LotArea', 'GarageArea', 'OpenPorchSF', 'SalePrice']
 
 # Write your code here:
+def plot(num_cols):
+    """Draw box plots of the given columns of ``data``, two per figure.
+
+    Columns are taken in consecutive pairs and each pair shares one
+    10x4 inch figure; when the list has an odd length the last column
+    is drawn alone in the left panel instead of being dropped.
+
+    Parameters
+    ----------
+    num_cols : list of str
+        Column names of the module-level ``data`` frame to plot.
+    """
+    for start in range(0, len(num_cols), 2):
+        plt.figure(figsize=(10, 4))
+        for panel, column in enumerate(num_cols[start:start + 2], start=1):
+            plt.subplot(1, 2, panel)
+            # Pass the column by keyword: newer seaborn releases reject
+            # the positional ``boxplot(None, column, ...)`` form.
+            sns.boxplot(y=column, data=data)
+        plt.tight_layout()
+        plt.show()
 
+plot(num_cols)
 
diff --git a/q03_regression_plot/build.py b/q03_regression_plot/build.py
index 2aaf8f6..bf10cb8 100644
--- a/q03_regression_plot/build.py
+++ b/q03_regression_plot/build.py
@@ -1,16 +1,28 @@
+# %load q03_regression_plot/build.py
 # Default imports
 import pandas as pd
 import seaborn as sns
 import matplotlib.pyplot as plt
-
-
-data = pd.read_csv('data/house_prices_multivariate.csv')
 plt.switch_backend('agg')
+data = pd.read_csv('data/house_prices_multivariate.csv')
+x = data['GrLivArea']
+y = data['SalePrice']
 
 # Write your code here
-
-
-
+def regression_plot(x, y):
+    """Scatter-plot ``y`` against ``x`` with a fitted regression line.
+
+    Parameters
+    ----------
+    x, y : pandas.Series
+        Named series to plot; their ``name`` attributes label the axes.
+    """
+    # Plot the series that were passed in rather than hard-coded columns,
+    # and pass x/y by keyword as newer seaborn releases require.
+    frame = pd.concat([x, y], axis=1)
+    sns.lmplot(x=x.name, y=y.name, data=frame, fit_reg=True)
+
+regression_plot(x, y)
 
 
 
diff --git a/q04_cor/build.py b/q04_cor/build.py
index f3fae50..b9e56b6 100644
--- a/q04_cor/build.py
+++ b/q04_cor/build.py
@@ -1,10 +1,24 @@
+# %load q04_cor/build.py
 # Default imports
 import pandas as pd
 import matplotlib.pyplot as plt
 import seaborn as sns
 
+plt.switch_backend('agg')
 data = pd.read_csv('data/house_prices_multivariate.csv')
 
-plt.switch_backend('agg')
 
 # Write your code here
+def cor(data):
+    """Draw a heatmap of the pairwise column correlations of ``data``.
+
+    Parameters
+    ----------
+    data : pandas.DataFrame
+        Frame whose ``corr()`` matrix is rendered on a 12x8 inch figure.
+    """
+    plt.figure(figsize=(12, 8))
+    sns.heatmap(data.corr(), cmap='viridis')
+
+cor(data)
+