The document contains code implementations for various machine learning algorithms, including decision trees using ID3 and CART methods, simple linear regression, and logistic regression. It utilizes Python libraries such as pandas, numpy, and matplotlib for data manipulation and visualization. The code reads data from CSV files, calculates necessary metrics, and builds models to predict outcomes based on input features.
ASSESSMENT-2

NAME - VAIBHAV DUTT TRIVEDI

REG. NO. – 22MIC0118

COURSE TITLE – MACHINE LEARNING

COURSE CODE – CSI 3026

LAB SLOT – L9+L10


CODE - DECISION TREE (ID3)
import pandas as pd
import numpy as np

def calculate_entropy(column):
    # Entropy H = -sum(p * log2(p)) over the unique values of the column
    values, counts = np.unique(column, return_counts=True)
    probabilities = counts / len(column)
    return -np.sum(probabilities * np.log2(probabilities))

def calculate_info_gain(data, feature, target):
    # Information gain = entropy of the target minus the weighted
    # entropy of the target within each subset of the feature
    total_entropy = calculate_entropy(data[target])
    feature_values = data[feature].unique()
    weighted_entropy = 0
    for value in feature_values:
        subset = data[data[feature] == value]
        weight = len(subset) / len(data)
        weighted_entropy += weight * calculate_entropy(subset[target])
    return total_entropy - weighted_entropy

def build_tree(data, features, target):
    # Stop when every row shares the same class label
    if len(np.unique(data[target])) == 1:
        return data[target].iloc[0]
    # No features left to split on: return the majority class
    if not features:
        return data[target].mode()[0]
    # Split on the feature with the highest information gain
    best_feature = max(features, key=lambda f: calculate_info_gain(data, f, target))
    tree = {best_feature: {}}
    remaining_features = [f for f in features if f != best_feature]
    for value in np.unique(data[best_feature]):
        subset = data[data[best_feature] == value]
        tree[best_feature][value] = build_tree(subset, remaining_features, target)
    return tree

data = pd.read_csv("id3.csv")
target = data.columns[-1]            # last column is the class label
features = list(data.columns[:-1])   # all remaining columns are features

decision_tree = build_tree(data, features, target)
print("Decision Tree:", decision_tree)
CODE - SIMPLE LINEAR REGRESSION
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

data = pd.read_csv('L.csv')
x = data['X']
y = data['Y']

n = len(x)           # number of observations
mean_x = np.mean(x)
mean_y = np.mean(y)

# Least-squares estimates:
# slope m = sum((x - x_mean)(y - y_mean)) / sum((x - x_mean)^2)
# intercept b = y_mean - m * x_mean
numerator = np.sum((x - mean_x) * (y - mean_y))
denom = np.sum((x - mean_x) ** 2)
slope = numerator / denom
intercept = mean_y - slope * mean_x

print("Slope (m):", slope)
print("Intercept (b):", intercept)

y_pred = slope * x + intercept

plt.scatter(x, y, color='blue', label='Data Points')
plt.plot(x, y_pred, color='red', label='Regression Line')
plt.xlabel('X')
plt.ylabel('Y')
plt.title('Simple Linear Regression')
plt.legend()
plt.show()
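
To judge how well the fitted line explains the data, one can compute the coefficient of determination from the same quantities. This snippet is a small add-on to the script above, assuming x, y, slope, and intercept are already defined as shown.

# R^2 = 1 - SS_res / SS_tot, computed from the fitted line above
ss_res = np.sum((y - (slope * x + intercept)) ** 2)   # residual sum of squares
ss_tot = np.sum((y - np.mean(y)) ** 2)                # total sum of squares
r_squared = 1 - ss_res / ss_tot
print("R^2:", r_squared)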
CODE - LOGISTIC REGRESSION
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

def sigmoid(z):
    # Logistic function: maps any real z to a probability in (0, 1)
    return 1 / (1 + np.exp(-z))

data = pd.read_csv('LOG.csv')
x = data['X']
y = data['Y']

n = len(x)           # number of observations
mean_x = np.mean(x)
mean_y = np.mean(y)

# Fit a straight line by least squares, then squash it through the
# sigmoid. Note: this is a simplified shortcut, not the usual
# maximum-likelihood fit used by standard logistic regression.
numerator = np.sum((x - mean_x) * (y - mean_y))
denom = np.sum((x - mean_x) ** 2)
slope = numerator / denom
intercept = mean_y - slope * mean_x

print("Slope (m):", slope)
print("Intercept (b):", intercept)

# Sort x so the curve is drawn left to right instead of zig-zagging
x_sorted = np.sort(x)
y_pred = sigmoid(slope * x_sorted + intercept)

plt.scatter(x, y, color='blue', label='Data Points')
plt.plot(x_sorted, y_pred, color='red', label='Logistic Regression Curve')
plt.xlabel('X')
plt.ylabel('Probability')
plt.title('Logistic Regression')
plt.legend()
plt.show()
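
Since the script above reuses the least-squares line, a sketch of logistic regression fitted the standard way, by gradient descent on the log-loss, is given below for comparison. It assumes the same x and y columns (with y holding 0/1 labels); fit_logistic is an illustrative helper, and the learning rate and epoch count are arbitrary choices.

def fit_logistic(x, y, lr=0.1, epochs=5000):
    # Gradient descent on the log-loss for a single-feature model:
    # p = sigmoid(w * x + b)
    x = np.asarray(x, dtype=float)
    y = np.asarray(y, dtype=float)
    w, b = 0.0, 0.0
    n = len(x)
    for _ in range(epochs):
        p = 1 / (1 + np.exp(-(w * x + b)))   # predicted probabilities
        grad_w = np.sum((p - y) * x) / n     # d(log-loss)/dw
        grad_b = np.sum(p - y) / n           # d(log-loss)/db
        w -= lr * grad_w
        b -= lr * grad_b
    return w, b

# Hypothetical usage with the data loaded above:
# w, b = fit_logistic(x, y)
# print("Weight:", w, "Bias:", b)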
CODE - DECISION TREE (CART)

import pandas as pd
import numpy as np

def gini_impurity(column):
    # Gini impurity = 1 - sum(p^2) over the unique values of the column
    values, counts = np.unique(column, return_counts=True)
    probabilities = counts / len(column)
    return 1 - np.sum(probabilities ** 2)

def calculate_gini_index(data, feature, target):
    # Weighted Gini impurity of the target across each subset of the feature
    feature_values = data[feature].unique()
    weighted_gini = 0
    for value in feature_values:
        subset = data[data[feature] == value]
        weight = len(subset) / len(data)
        weighted_gini += weight * gini_impurity(subset[target])
    return weighted_gini

def build_cart_tree(data, features, target):
    # Note: this builds multiway splits scored by the Gini index; classical
    # CART restricts itself to binary splits, but the criterion is the same.
    if len(np.unique(data[target])) == 1:
        return data[target].iloc[0]       # pure node: return the class label
    if not features:
        return data[target].mode()[0]     # no features left: majority class
    # Split on the feature with the lowest weighted Gini impurity
    best_feature = min(features, key=lambda f: calculate_gini_index(data, f, target))
    tree = {best_feature: {}}
    remaining_features = [f for f in features if f != best_feature]
    for value in np.unique(data[best_feature]):
        subset = data[data[best_feature] == value]
        tree[best_feature][value] = build_cart_tree(subset, remaining_features, target)
    return tree

data = pd.read_csv("cart.csv")
target = data.columns[-1]            # last column is the class label
features = list(data.columns[:-1])

decision_tree = build_cart_tree(data, features, target)
print("Decision Tree:", decision_tree)
