DM Practical06

The document contains Python code for implementing a Random Forest classifier using decision trees. It includes classes for DecisionTree and RandomForest, with methods for fitting the model, making predictions, and calculating information gain and entropy. The example usage demonstrates training the Random Forest on a sample dataset and making predictions.
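For reference, the entropy used in the listing below is H(y) = -Σ p_c · log2(p_c) over the class probabilities p_c, and a split's information gain is the parent entropy minus the size-weighted entropies of its two children. A minimal sketch that checks these numbers on the sample labels from the example (an illustrative addition, not part of the assignment code):

import numpy as np

y = np.array([0, 0, 0, 1, 1, 1])  # the example labels used below

def entropy(labels):
    # H = -sum(p * log2(p)) over the nonzero class probabilities.
    probs = np.bincount(labels) / len(labels)
    probs = probs[probs > 0]
    return -np.sum(probs * np.log2(probs))

print(entropy(y))  # 1.0: a 50/50 class mix carries one full bit

# Splitting the example data on feature 0 at threshold 2 puts the first
# three samples on the left and the rest on the right. Both children are
# pure (entropy 0), so the gain equals the full parent entropy.
left, right = y[:3], y[3:]
p = len(left) / len(y)
print(entropy(y) - (p * entropy(left) + (1 - p) * entropy(right)))  # 1.0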

Assignment No: 06
Assignment Name: Classification using Random Forest
Roll No: 05
import numpy as np
from collections import Counter


class DecisionTree:
    def fit(self, X, y):
        self.tree = self._grow_tree(X, y)

    def _grow_tree(self, X, y):
        # Pure node: every sample has the same label, so return it as a leaf.
        if len(set(y)) == 1:
            return y[0]

        n_samples, n_features = X.shape
        best_feature, best_threshold = self._best_split(X, y, n_features)

        # No useful split was found: return the majority label as a leaf.
        if best_feature is None:
            return Counter(y).most_common(1)[0][0]

        # Partition the data on the best split and grow each subtree.
        left_indices = X[:, best_feature] < best_threshold
        right_indices = X[:, best_feature] >= best_threshold
        left_child = self._grow_tree(X[left_indices], y[left_indices])
        right_child = self._grow_tree(X[right_indices], y[right_indices])
        return (best_feature, best_threshold, left_child, right_child)

    def _best_split(self, X, y, n_features):
        best_gain = -1
        best_feature, best_threshold = None, None

        for feature in range(n_features):
            thresholds = np.unique(X[:, feature])
            for threshold in thresholds:
                left_y = y[X[:, feature] < threshold]
                right_y = y[X[:, feature] >= threshold]
                if len(left_y) == 0 or len(right_y) == 0:
                    continue  # skip splits that leave one side empty
                gain = self._information_gain(y, left_y, right_y)

                if gain > best_gain:
                    best_gain = gain
                    best_feature = feature
                    best_threshold = threshold

        return best_feature, best_threshold

    def _information_gain(self, y, left_y, right_y):
        # Parent entropy minus the size-weighted entropies of the children.
        p = len(left_y) / len(y)
        return self._entropy(y) - (p * self._entropy(left_y) + (1 - p) * self._entropy(right_y))

    def _entropy(self, y):
        probabilities = np.bincount(y) / len(y)
        # The 1e-6 term keeps log2 finite when a class probability is zero.
        return -np.sum(probabilities * np.log2(probabilities + 1e-6))

    def predict(self, X):
        return np.array([self._predict(sample) for sample in X])

    def _predict(self, sample):
        # Walk from the root until reaching a leaf (a bare label, not a tuple).
        node = self.tree
        while isinstance(node, tuple):
            feature, threshold, left_child, right_child = node
            if sample[feature] < threshold:
                node = left_child
            else:
                node = right_child
        return node


class RandomForest:
    def __init__(self, n_trees=5):
        self.n_trees = n_trees
        self.trees = []

    def fit(self, X, y):
        # Fit each tree on a bootstrap sample (rows drawn with replacement).
        for _ in range(self.n_trees):
            indices = np.random.choice(len(y), len(y), replace=True)
            X_sample = X[indices]
            y_sample = y[indices]
            tree = DecisionTree()
            tree.fit(X_sample, y_sample)
            self.trees.append(tree)

    def predict(self, X):
        # Majority vote across the trees; each column holds one sample's votes.
        tree_predictions = np.array([tree.predict(X) for tree in self.trees])
        return [Counter(tree_preds).most_common(1)[0][0]
                for tree_preds in tree_predictions.T]


# Example usage
if __name__ == "__main__":
    # Sample dataset
    X = np.array([[1, 2], [1, 4], [1, 0],
                  [2, 2], [2, 4], [2, 0]])
    y = np.array([0, 0, 0, 1, 1, 1])  # Binary labels

    # Create and train the Random Forest
    rf = RandomForest(n_trees=5)
    rf.fit(X, y)

    # Make predictions
    predictions = rf.predict(X)
    print("Predictions:", predictions)

OUTPUT:
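The dataset is perfectly separable on feature 0 (value 1 means class 0, value 2 means class 1), so each bootstrapped tree splits on it and the majority vote reproduces the training labels. A typical run prints the line below (NumPy 2.x may render the integers as np.int64(0) and so on):

Predictions: [0, 0, 0, 1, 1, 1]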
