|
4 | 4 | removeall, unique, product, mode, argmax, argmax_random_tie, isclose, gaussian, |
5 | 5 | dotproduct, vector_add, scalar_vector_product, weighted_sample_with_replacement, |
6 | 6 | weighted_sampler, num_or_str, normalize, clip, sigmoid, print_table, |
7 | | - open_data, sigmoid_derivative |
| 7 | + open_data, sigmoid_derivative, probability |
8 | 8 | ) |
9 | 9 |
|
10 | 10 | import copy |
@@ -493,6 +493,33 @@ def information_content(values): |
493 | 493 |
|
494 | 494 | # ______________________________________________________________________________ |
495 | 495 |
|
| 496 | + |
def RandomForest(dataset, n=5):
    """An ensemble of decision trees trained using bagging and feature bagging.

    Each of the n trees is trained on a bootstrap sample of the examples
    (bagging) and a random subset of the input attributes (feature bagging).
    Returns a predict(example) function that classifies by majority vote
    over the ensemble.
    """

    def data_bagging(dataset, m=0):
        """Sample m examples with replacement (defaults to all examples)."""
        # Fixed: original referenced a bare `examples` name (NameError).
        n_examples = len(dataset.examples)
        return weighted_sample_with_replacement(m or n_examples,
                                                dataset.examples,
                                                [1] * n_examples)

    def feature_bagging(dataset, p=0.7):
        """Feature bagging with probability p to retain an attribute."""
        inputs = [i for i in dataset.inputs if probability(p)]
        # Guard against the (unlikely) case where every attribute was dropped.
        return inputs or dataset.inputs

    # The helpers must be defined before this comprehension runs; the
    # original built `predictors` first, raising NameError. Also fixed
    # the `datatset` typo in the feature_bagging call.
    predictors = [DecisionTreeLearner(examples=data_bagging(dataset),
                                      attrs=dataset.attrs,
                                      attrnames=dataset.attrnames,
                                      target=dataset.target,
                                      inputs=feature_bagging(dataset))
                  for _ in range(n)]

    def predict(example):
        """Classify example by majority vote of the ensemble's predictions."""
        return mode(predictor(example) for predictor in predictors)

    return predict
| 520 | + |
| 521 | +# ______________________________________________________________________________ |
| 522 | + |
496 | 523 | # A decision list is implemented as a list of (test, value) pairs. |
497 | 524 |
|
498 | 525 |
|
|
0 commit comments