diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc
index 2e5da7d..f6bd725 100644
Binary files a/__pycache__/__init__.cpython-36.pyc and b/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc
index 2f9a42a..3e34827 100644
Binary files a/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc and b/q01_outlier_removal/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_outlier_removal/__pycache__/build.cpython-36.pyc b/q01_outlier_removal/__pycache__/build.cpython-36.pyc
index 8248a16..24a4d7b 100644
Binary files a/q01_outlier_removal/__pycache__/build.cpython-36.pyc and b/q01_outlier_removal/__pycache__/build.cpython-36.pyc differ
diff --git a/q01_outlier_removal/build.py b/q01_outlier_removal/build.py
index ec278ba..edf4dc4 100644
--- a/q01_outlier_removal/build.py
+++ b/q01_outlier_removal/build.py
@@ -1,8 +1,16 @@
+# %load q01_outlier_removal/build.py
 # Default imports
 import pandas as pd
 
-loan_data = pd.read_csv('data/loan_prediction_uncleaned.csv')
-loan_data = loan_data.drop('Loan_ID', 1)
+df = pd.read_csv('data/loan_prediction_uncleaned.csv')
+df = df.drop('Loan_ID', 1)
 
 
 # Write your Solution here:
+def outlier_removal(df):
+    df = df.drop(df[(df['ApplicantIncome']>df['ApplicantIncome'].quantile(0.95)) | 
+                    (df['CoapplicantIncome']>df['CoapplicantIncome'].quantile(0.95)) | 
+                    (df['LoanAmount']>df['LoanAmount'].quantile(0.95))].index)
+    return df
+
+
diff --git a/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc
index 5a057ff..9cd3e0f 100644
Binary files a/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc and b/q01_outlier_removal/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc b/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc
index 4c0b6c7..c262e9f 100644
Binary files a/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc and b/q01_outlier_removal/tests/__pycache__/test_q01_outlier_removal.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..baa030c
Binary files /dev/null and b/q02_data_cleaning_all/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all/__pycache__/build.cpython-36.pyc b/q02_data_cleaning_all/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..28964f1
Binary files /dev/null and b/q02_data_cleaning_all/__pycache__/build.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all/build.py b/q02_data_cleaning_all/build.py
index b56e2bc..5a251a4 100644
--- a/q02_data_cleaning_all/build.py
+++ b/q02_data_cleaning_all/build.py
@@ -1,10 +1,12 @@
+# %load q02_data_cleaning_all/build.py
 # Default Imports
 import sys, os
 sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname('__file__'))))
 import pandas as pd
 import numpy as np
-from sklearn.model_selection import train_test_split
+from sklearn.model_selection import train_test_split as tts
 from greyatomlib.logistic_regression_project.q01_outlier_removal.build import outlier_removal
+from sklearn.preprocessing import Imputer
 
 loan_data = pd.read_csv('data/loan_prediction_uncleaned.csv')
 loan_data = loan_data.drop('Loan_ID', 1)
@@ -12,3 +14,24 @@
 
 
 # Write your solution here :
+def data_cleaning(df):
+    
+    imp_mean = Imputer(missing_values = float('NaN'), strategy='mean')
+    df['LoanAmount'] = imp_mean.fit_transform(df[['LoanAmount']]).ravel()
+         
+    df['Gender']  = df['Gender'].fillna(df['Gender'].mode()[0])
+    df['Married'] = df['Married'].fillna(df['Married'].mode()[0])
+    df['Dependents'] = df['Dependents'].fillna(df['Dependents'].mode()[0])
+    df['Self_Employed'] = df['Self_Employed'].fillna(df['Self_Employed'].mode()[0])
+    df['Loan_Amount_Term'] = df['Loan_Amount_Term'].fillna(df['Loan_Amount_Term'].mode()[0])
+    df['Credit_History'] = df['Credit_History'].fillna(df['Credit_History'].mode()[0])
+        
+    X=df.drop(['LoanAmount'],axis=1)
+    y=df['LoanAmount']
+  
+    X_train, X_test, y_train, y_test = tts(X, y, test_size = 0.25, random_state = 9)
+    
+    return (X,y,X_train, X_test, y_train, y_test)
+
+
+
diff --git a/q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..5475eda
Binary files /dev/null and b/q02_data_cleaning_all/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc b/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc
new file mode 100644
index 0000000..57931fd
Binary files /dev/null and b/q02_data_cleaning_all/tests/__pycache__/test_q02_data_cleaning.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..a7dbdc9
Binary files /dev/null and b/q02_data_cleaning_all_2/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc b/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..6caaaef
Binary files /dev/null and b/q02_data_cleaning_all_2/__pycache__/build.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all_2/build.py b/q02_data_cleaning_all_2/build.py
index e20ff7b..3bf97f3 100644
--- a/q02_data_cleaning_all_2/build.py
+++ b/q02_data_cleaning_all_2/build.py
@@ -1,3 +1,4 @@
+# %load q02_data_cleaning_all_2/build.py
 # Default Imports
 import pandas as pd
 import numpy as np
@@ -11,3 +12,17 @@
 
 
 # Write your solution here :
+def data_cleaning_2(X_train, X_test, y_train, y_test):
+    
+    CCL=['Gender', 'Married', 'Dependents', 'Education', 'Self_Employed', 'Property_Area']
+    X_train=pd.get_dummies(X_train,columns=CCL, drop_first=True)
+    X_test=pd.get_dummies(X_test,columns=CCL, drop_first=True)
+    
+    numeric_column=['ApplicantIncome', 'CoapplicantIncome', 'LoanAmount']
+    for c in numeric_column:
+        X_train[c] = np.sqrt(X_train[c])
+        X_test[c] = np.sqrt(X_test[c])
+    return X_train, X_test, y_train, y_test
+
+
+
diff --git a/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..5e81584
Binary files /dev/null and b/q02_data_cleaning_all_2/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc b/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc
new file mode 100644
index 0000000..30b3b15
Binary files /dev/null and b/q02_data_cleaning_all_2/tests/__pycache__/q02_test_data_cleaning_2.cpython-36.pyc differ
diff --git a/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..a572cce
Binary files /dev/null and b/q03_logistic_regression/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_logistic_regression/__pycache__/build.cpython-36.pyc b/q03_logistic_regression/__pycache__/build.cpython-36.pyc
new file mode 100644
index 0000000..3e8a6fa
Binary files /dev/null and b/q03_logistic_regression/__pycache__/build.cpython-36.pyc differ
diff --git a/q03_logistic_regression/build.py b/q03_logistic_regression/build.py
index cdbd506..fa0533e 100644
--- a/q03_logistic_regression/build.py
+++ b/q03_logistic_regression/build.py
@@ -1,3 +1,4 @@
+# %load q03_logistic_regression/build.py
 # Default Imports
 import pandas as pd
 from sklearn.preprocessing import StandardScaler
@@ -16,3 +17,17 @@
 
 # Write your solution code here:
 
+def logistic_regression(X_train,X_test,y_train,y_test):
+    
+    scale = StandardScaler()
+    scale.fit(X_train[['ApplicantIncome','CoapplicantIncome','LoanAmount']])
+    
+    log_reg = LogisticRegression()
+    log_reg.fit(X_train,y_train)
+    
+    y_pred = log_reg.predict(X_test)
+    conf_matrix = confusion_matrix(y_test,y_pred)
+       
+    return conf_matrix
+
+
diff --git a/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc
new file mode 100644
index 0000000..b08fce5
Binary files /dev/null and b/q03_logistic_regression/tests/__pycache__/__init__.cpython-36.pyc differ
diff --git a/q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc b/q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc
new file mode 100644
index 0000000..1ab10c5
Binary files /dev/null and b/q03_logistic_regression/tests/__pycache__/test_q03_logistic_regression.cpython-36.pyc differ