diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..0269bda
Binary files /dev/null and b/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_missing_value/__pycache__/__init__.cpython-36.pyc b/q01_missing_value/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..48fe166
Binary files /dev/null and b/q01_missing_value/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_missing_value/__pycache__/build.cpython-36.pyc b/q01_missing_value/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..ee80273
Binary files /dev/null and b/q01_missing_value/__pycache__/build.cpython-36.pyc differ
diff --git a/q01_missing_value/build.py b/q01_missing_value/build.py
index 7dc4d18..a94c885 100644
--- a/q01_missing_value/build.py
+++ b/q01_missing_value/build.py
@@ -1,5 +1,8 @@
+# %load q01_missing_value/build.py
 # Default imports
 import pandas as pd
+from sklearn.preprocessing import Imputer
+import numpy as np
 
 # Data loading
 ny_housing = pd.read_csv('data/train.csv')
@@ -8,3 +11,39 @@
 
 
 # Write your code here:
+def imputation(dataset):
+    """Fill missing values in ``dataset`` and split it by column kind.
+
+    Numeric columns have NaN replaced by the column mean; every other
+    column has NaN replaced by its most frequent value.
+
+    Parameters
+    ----------
+    dataset : pandas.DataFrame
+        Frame to impute; it is left unmodified.
+
+    Returns
+    -------
+    tuple of (pandas.DataFrame, pandas.DataFrame)
+        ``(numeric_df, categorical_df)``, both indexed like ``dataset``.
+        Numeric columns are returned as float64.
+    """
+    # Cast to float so the result keeps the all-float dtype that the
+    # previous sklearn Imputer-based implementation produced.
+    numeric_df = dataset._get_numeric_data().astype(float)
+    # Derive the non-numeric columns from ``dataset`` itself rather than a
+    # module-level frame, and keep them in their original order.
+    categorical_cols = [c for c in dataset.columns if c not in numeric_df.columns]
+    categorical_df = dataset[categorical_cols].copy()
+
+    for column in categorical_cols:
+        counts = categorical_df[column].value_counts()
+        if counts.empty:
+            continue  # column is entirely missing, so there is no mode
+        categorical_df[column] = categorical_df[column].fillna(counts.index[0])
+
+    # Impute only genuine NaNs: zeros are real observations and must not be
+    # overwritten with the column mean.
+    numeric_df = numeric_df.fillna(numeric_df.mean())
+
+    return numeric_df, categorical_df
diff --git a/q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc b/q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..819240b
Binary files /dev/null and b/q01_missing_value/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_missing_value/tests/__pycache__/test_q01_imputation.cpython-36.pyc b/q01_missing_value/tests/__pycache__/test_q01_imputation.cpython-36.pyc
new file mode 100644
index 0000000..2572859
Binary files /dev/null and b/q01_missing_value/tests/__pycache__/test_q01_imputation.cpython-36.pyc differ
diff --git a/q02_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q02_outlier_removal/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..45bcb2e
Binary files /dev/null and b/q02_outlier_removal/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_outlier_removal/__pycache__/build.cpython-36.pyc b/q02_outlier_removal/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..9d0064a
Binary files /dev/null and b/q02_outlier_removal/__pycache__/build.cpython-36.pyc differ
diff --git a/q02_outlier_removal/build.py b/q02_outlier_removal/build.py
index 74df5f2..7692977 100644
--- a/q02_outlier_removal/build.py
+++ b/q02_outlier_removal/build.py
@@ -1,3 +1,4 @@
+# %load q02_outlier_removal/build.py
 # Default imports
 import pandas as pd
 
@@ -8,3 +9,21 @@
 
 
 # Write your code here:
+def outlier_removal(housing_data):
+    """Drop rows lying above the 95th percentile of any numeric feature.
+
+    Every numeric column except ``SalePrice`` is visited in column order.
+    The cut-off for a column is computed on the rows that survived the
+    columns before it, so the filtering is cumulative.
+
+    Returns the filtered frame; ``housing_data`` itself is not modified.
+    """
+    numeric_part = housing_data._get_numeric_data()
+    feature_names = numeric_part.drop(['SalePrice'], axis=1).columns
+    remaining = housing_data
+    for name in feature_names:
+        cutoff = remaining[name].quantile(0.95)
+        too_large = remaining.index[remaining[name] > cutoff]
+        # drop() returns a new frame, so the caller's object stays intact.
+        remaining = remaining.drop(too_large)
+    return remaining
diff --git a/q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..d8f38bd
Binary files /dev/null and b/q02_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_outlier_removal/tests/__pycache__/test_q02_outlier_removal.cpython-36.pyc b/q02_outlier_removal/tests/__pycache__/test_q02_outlier_removal.cpython-36.pyc
new file mode 100644
index 0000000..1839b76
Binary files /dev/null and b/q02_outlier_removal/tests/__pycache__/test_q02_outlier_removal.cpython-36.pyc differ
diff --git a/q03_skewness_log/__pycache__/__init__.cpython-36.pyc b/q03_skewness_log/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..1181571
Binary files /dev/null and b/q03_skewness_log/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_skewness_log/__pycache__/build.cpython-36.pyc b/q03_skewness_log/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..06bbcc7
Binary files /dev/null and b/q03_skewness_log/__pycache__/build.cpython-36.pyc differ
diff --git a/q03_skewness_log/build.py b/q03_skewness_log/build.py
index f008d0f..d441101 100644
--- a/q03_skewness_log/build.py
+++ b/q03_skewness_log/build.py
@@ -1,3 +1,4 @@
+# %load q03_skewness_log/build.py
 from scipy.stats import skew
 import pandas as pd
 import numpy as np
@@ -6,3 +7,25 @@
 
 
 # Write code here:
+def skewness_log(data):
+    """Return the skewness of log-transformed ``GrLivArea`` and ``SalePrice``.
+
+    The natural log is taken on derived Series, so the caller's frame is
+    left untouched and repeated calls give the same result.
+
+    Parameters
+    ----------
+    data : pandas.DataFrame
+        Frame with ``GrLivArea`` and ``SalePrice`` columns (assumed
+        strictly positive, since the log of zero is -inf).
+
+    Returns
+    -------
+    tuple
+        ``(skew of log GrLivArea, skew of log SalePrice)``.
+    """
+    # Do not assign the logs back into ``data``: doing so made a second
+    # call operate on already-transformed values.
+    log_area = np.log(data['GrLivArea'])
+    log_price = np.log(data['SalePrice'])
+    return skew(log_area), skew(log_price)
diff --git a/q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc b/q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..fa298c6
Binary files /dev/null and b/q03_skewness_log/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_skewness_log/tests/__pycache__/test_q03_skewness_log.cpython-36.pyc b/q03_skewness_log/tests/__pycache__/test_q03_skewness_log.cpython-36.pyc
new file mode 100644
index 0000000..8e20975
Binary files /dev/null and b/q03_skewness_log/tests/__pycache__/test_q03_skewness_log.cpython-36.pyc differ
diff --git a/q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc b/q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..d76370d
Binary files /dev/null and b/q03_skewness_sqrt/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_skewness_sqrt/__pycache__/build.cpython-36.pyc b/q03_skewness_sqrt/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..d8bfc32
Binary files /dev/null and b/q03_skewness_sqrt/__pycache__/build.cpython-36.pyc differ
diff --git a/q03_skewness_sqrt/build.py b/q03_skewness_sqrt/build.py
index 4bdb0e4..3850c54 100644
--- a/q03_skewness_sqrt/build.py
+++ b/q03_skewness_sqrt/build.py
@@ -1,3 +1,4 @@
+# %load q03_skewness_sqrt/build.py
 # Default imports
 from scipy.stats import skew
 import pandas as pd
@@ -7,4 +8,26 @@
 
 
 # Write your Solution Here:
+def skewness_sqrt(data):
+    """Return the skewness of square-rooted ``GrLivArea`` and ``SalePrice``.
+
+    The square root is taken on derived Series, so the caller's frame is
+    left untouched and repeated calls give the same result.
+
+    Parameters
+    ----------
+    data : pandas.DataFrame
+        Frame with ``GrLivArea`` and ``SalePrice`` columns (assumed
+        non-negative, since the square root of a negative value is NaN).
+
+    Returns
+    -------
+    tuple
+        ``(skew of sqrt GrLivArea, skew of sqrt SalePrice)``.
+    """
+    # Do not assign the roots back into ``data``: doing so made a second
+    # call operate on already-transformed values.
+    sqrt_area = np.sqrt(data['GrLivArea'])
+    sqrt_price = np.sqrt(data['SalePrice'])
+    return skew(sqrt_area), skew(sqrt_price)
 
diff --git a/q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc b/q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..bda0442
Binary files /dev/null and b/q03_skewness_sqrt/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc b/q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc
new file mode 100644
index 0000000..2b88a92
Binary files /dev/null and b/q03_skewness_sqrt/tests/__pycache__/test-q03_skewness_sqrt.cpython-36.pyc differ
diff --git a/q04_encoding/__pycache__/__init__.cpython-36.pyc b/q04_encoding/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..69dc991
Binary files /dev/null and b/q04_encoding/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q04_encoding/__pycache__/build.cpython-36.pyc b/q04_encoding/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..af73c20
Binary files /dev/null and b/q04_encoding/__pycache__/build.cpython-36.pyc differ
diff --git a/q04_encoding/build.py b/q04_encoding/build.py
index a52c57f..6265f89 100644
--- a/q04_encoding/build.py
+++ b/q04_encoding/build.py
@@ -1,3 +1,4 @@
+# %load q04_encoding/build.py
 # Default imports
 import pandas as pd
 from sklearn.preprocessing import LabelEncoder
@@ -7,4 +8,27 @@
 
 
 # Write your code here:
+def encoding(housing_data):
+    """Label-encode ``LotShape`` and one-hot encode ``GarageType``.
+
+    Parameters
+    ----------
+    housing_data : pandas.DataFrame
+        Frame with ``LotShape`` and ``GarageType`` columns; it is left
+        unmodified.
+
+    Returns
+    -------
+    pandas.DataFrame
+        Copy of the input with a ``LotShape_Label`` column appended, followed
+        by one indicator column per ``GarageType`` category; the original
+        ``GarageType`` column is removed.
+    """
+    # Work on a copy so the new label column is not added to the caller's
+    # frame as a side effect.
+    encoded = housing_data.copy()
+    encoded['LotShape_Label'] = LabelEncoder().fit_transform(encoded['LotShape'])
+    garage_dummies = pd.get_dummies(encoded['GarageType'])
+    combined = pd.concat([encoded, garage_dummies], axis=1)
+    return combined.drop(['GarageType'], axis=1)
 
diff --git a/q04_encoding/tests/__pycache__/__init__.cpython-36.pyc b/q04_encoding/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..86dbf32
Binary files /dev/null and b/q04_encoding/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc b/q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc
new file mode 100644
index 0000000..a9e2ab4
Binary files /dev/null and b/q04_encoding/tests/__pycache__/test_q04_encoding.cpython-36.pyc differ