From 282d28f8219c2760bac2d9c83cf36b5bfe9d5de8 Mon Sep 17 00:00:00 2001
From: hrishiSU <hrishikesh.suslade1@gmail.com>
Date: Wed, 16 Oct 2019 01:24:54 +0530
Subject: [PATCH 1/2] Added Pytests for Decission Tree

Modified the mean_squared_error to be a static method

Created the Test_Decision_Tree class
Consists of two methods
1. helper_mean_squared_error_test: This method calculates the mean squared error manually without using
numpy. Instead a for loop is used for the same.
2. test_one_mean_squared_error: This method considers a simple test case and compares the results by the
helper function and the original mean_squared_error method of Decision_Tree class. This is done using asert
keyword.

Execution:
PyTest installation
pip3 install pytest OR pip install pytest

Test function execution
pytest decision_tree.py
---
 machine_learning/decision_tree.py | 36 +++++++++++++++++++++++++++++++
 1 file changed, 36 insertions(+)

diff --git a/machine_learning/decision_tree.py b/machine_learning/decision_tree.py
index 4f7a4d12966e..64d4edebcd47 100644
--- a/machine_learning/decision_tree.py
+++ b/machine_learning/decision_tree.py
@@ -15,6 +15,7 @@ def __init__(self, depth=5, min_leaf_size=5):
         self.min_leaf_size = min_leaf_size
         self.prediction = None
 
+    @staticmethod
     def mean_squared_error(self, labels, prediction):
         """
         mean_squared_error:
@@ -117,6 +118,41 @@ def predict(self, x):
             print("Error: Decision tree not yet trained")
             return None
 
+class Test_Decision_Tree:
+    """Decision Tres test class
+    To execute
+            pip install pytest
+            pytest decision_tree.py
+    If all test functions are passed a success message shall be displayed
+    
+    """
+
+    @staticmethod
+    def helper_mean_squared_error_test(labels, prediction):
+        """
+        helper_mean_squared_error_test:
+        @param labels: a one dimensional numpy array
+        @param prediction: a floating point value
+        return value: helper_mean_squared_error_test calculates the mean squared error 
+        """
+        squared_error_sum = np.float(0)
+        for label in labels:
+            squared_error_sum += ((label-prediction) ** 2)
+
+        return np.float(squared_error_sum/labels.size)
+         
+    
+    def test_one_mean_sqaurred_error(self):
+        """
+        test_one_mean_squared_error:
+        return value: test_one_mean_squared_error verifies the mean_squared_error function value for the given test case 
+        """       
+        test_labels = np.array([1,2,3,4,5,6,7,8,9,10])
+        test_prediction = np.float(6)
+        assert Decision_Tree.mean_squared_error(self,test_labels,test_prediction) == Test_Decision_Tree.helper_mean_squared_error_test(test_labels,test_prediction)
+    
+    
+
 
 def main():
     """

From 6014f29bd4e2d5a86c59aaafc678bab167efc63e Mon Sep 17 00:00:00 2001
From: hrishiSU <hrishikesh.suslade1@gmail.com>
Date: Fri, 18 Oct 2019 19:55:53 +0530
Subject: [PATCH 2/2] Modified the pytests to be compatible with the doctest
 Added 2 doctest in the mean_squared_error method For its verification a
 static method helper_mean_squared_error(labels, prediction) is used It uses a
 for loop to calculate the error instead of the numpy inbuilt methods
 Execution ``` pytest .\decision_tree.py --doctest-modules ```

---
 machine_learning/decision_tree.py | 26 +++++++++++---------------
 1 file changed, 11 insertions(+), 15 deletions(-)

diff --git a/machine_learning/decision_tree.py b/machine_learning/decision_tree.py
index 64d4edebcd47..14c02b64df0c 100644
--- a/machine_learning/decision_tree.py
+++ b/machine_learning/decision_tree.py
@@ -15,13 +15,20 @@ def __init__(self, depth=5, min_leaf_size=5):
         self.min_leaf_size = min_leaf_size
         self.prediction = None
 
-    @staticmethod
     def mean_squared_error(self, labels, prediction):
         """
         mean_squared_error:
         @param labels: a one dimensional numpy array
         @param prediction: a floating point value
         return value: mean_squared_error calculates the error if prediction is used to estimate the labels
+        >>> tester = Decision_Tree()
+        >>> test_labels = np.array([1,2,3,4,5,6,7,8,9,10])
+        >>> test_prediction = np.float(6)
+        >>> assert tester.mean_squared_error(test_labels, test_prediction) == Test_Decision_Tree.helper_mean_squared_error_test(test_labels, test_prediction)
+        >>> test_labels = np.array([1,2,3])
+        >>> test_prediction = np.float(2)
+        >>> assert tester.mean_squared_error(test_labels, test_prediction) == Test_Decision_Tree.helper_mean_squared_error_test(test_labels, test_prediction)
+
         """
         if labels.ndim != 1:
             print("Error: Input labels must be one dimensional")
@@ -120,11 +127,6 @@ def predict(self, x):
 
 class Test_Decision_Tree:
     """Decision Tres test class
-    To execute
-            pip install pytest
-            pytest decision_tree.py
-    If all test functions are passed a success message shall be displayed
-    
     """
 
     @staticmethod
@@ -140,16 +142,7 @@ def helper_mean_squared_error_test(labels, prediction):
             squared_error_sum += ((label-prediction) ** 2)
 
         return np.float(squared_error_sum/labels.size)
-         
     
-    def test_one_mean_sqaurred_error(self):
-        """
-        test_one_mean_squared_error:
-        return value: test_one_mean_squared_error verifies the mean_squared_error function value for the given test case 
-        """       
-        test_labels = np.array([1,2,3,4,5,6,7,8,9,10])
-        test_prediction = np.float(6)
-        assert Decision_Tree.mean_squared_error(self,test_labels,test_prediction) == Test_Decision_Tree.helper_mean_squared_error_test(test_labels,test_prediction)
     
     
 
@@ -177,3 +170,6 @@ def main():
 
 if __name__ == "__main__":
     main()
+    import doctest
+
+    doctest.testmod(name="mean_squarred_error", verbose=True)