DMT Cia2

K Means

import pandas as pd
from sklearn.cluster import KMeans
from sklearn.preprocessing import StandardScaler
import matplotlib.pyplot as plt

# Load the Iris dataset
data = pd.read_csv('iris.csv')

# Separate features and target variable
X = data.drop('species', axis=1)
y = data['species']

# Standardize the features
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)

# Create a K-means clustering model with 3 clusters
kmeans = KMeans(n_clusters=3, random_state=42)

# Fit the model to the scaled data
kmeans.fit(X_scaled)

# Get the cluster labels
labels = kmeans.labels_

# Visualize the clusters on the first two standardized features
plt.scatter(X_scaled[:, 0], X_scaled[:, 1], c=labels)
plt.title('K-means Clustering of Iris Dataset')
plt.xlabel('Sepal Length (standardized)')
plt.ylabel('Sepal Width (standardized)')
plt.show()
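
The example above fixes the number of clusters at 3 because the Iris dataset has three species. When the right k is not known in advance, the elbow method is a common way to choose it; below is a minimal sketch, reusing X_scaled from the code above:

# Plot within-cluster sum of squares (inertia) for a range of k;
# the "elbow" where the curve flattens suggests a reasonable k
inertias = []
k_values = range(1, 11)
for k in k_values:
    km = KMeans(n_clusters=k, n_init=10, random_state=42)
    km.fit(X_scaled)
    inertias.append(km.inertia_)

plt.plot(k_values, inertias, marker='o')
plt.title('Elbow Method')
plt.xlabel('Number of clusters (k)')
plt.ylabel('Inertia')
plt.show()
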
Decision Tree

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score

# Load the Zoo dataset
data = pd.read_csv('zoo.csv')

# Separate features and target variable (also drop the non-numeric
# 'animal_name' column, which the classifier cannot use directly)
X = data.drop(['animal_name', 'type'], axis=1)
y = data['type']

# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Create a decision tree classifier
clf = DecisionTreeClassifier(random_state=42)

# Fit the classifier to the training data
clf.fit(X_train, y_train)

# Make predictions on the testing data
y_pred = clf.predict(X_test)

# Calculate accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
The same classifier also works on a small hand-built dataset, as long as the categorical features are encoded numerically first:

import pandas as pd
from sklearn.tree import DecisionTreeClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

# Create a DataFrame with your CPT data (replace with your actual data)
data = pd.DataFrame({
    'age': ['<=30', '<=30', '<=30', '>30', '>30', '>30', '<=30', '>30', '>30', '<=30'],
    'income': ['low', 'low', 'medium', 'medium', 'medium', 'high', 'high', 'low', 'medium', 'high'],
    'student': ['yes', 'yes', 'yes', 'no', 'no', 'no', 'yes', 'no', 'no', 'yes'],
    'credit_rating': ['excellent', 'good', 'excellent', 'excellent', 'fair', 'fair', 'good', 'excellent', 'fair', 'good'],
    'buys_computer': ['yes', 'yes', 'yes', 'no', 'no', 'yes', 'yes', 'no', 'yes', 'yes']
})

# Separate features and target variable, one-hot encoding the
# categorical features (the classifier requires numeric input)
X = pd.get_dummies(data.drop('buys_computer', axis=1))
y = data['buys_computer']

# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Create a decision tree classifier
clf = DecisionTreeClassifier(random_state=42)

# Fit the classifier to the training data
clf.fit(X_train, y_train)

# Make predictions on the testing data
y_pred = clf.predict(X_test)

# Evaluate the model (e.g., accuracy)
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
K Nearest Neighbour

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score

# Assuming your data is in a CSV file named 'zoo.csv'
data = pd.read_csv('zoo.csv')

# Separate features (X) and target variable (y): drop the non-numeric
# 'animal_name' column and predict the animal 'type'
X = data.drop(['animal_name', 'type'], axis=1)
y = data['type']

# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Standardize the features
scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

# Create a KNN classifier with k=3 (you can adjust the value of k)
knn = KNeighborsClassifier(n_neighbors=3)

# Fit the classifier to the training data
knn.fit(X_train_scaled, y_train)

# Make predictions on the testing data
y_pred = knn.predict(X_test_scaled)

# Calculate accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
Eclat Algorithm

import pandas as pd
from mlxtend.frequent_patterns import apriori, association_rules
from mlxtend.preprocessing import TransactionEncoder

# Create a sample dataset (replace with your own data)
data = [
    ['milk', 'bread', 'eggs'],
    ['bread', 'butter'],
    ['milk', 'bread', 'butter'],
    ['milk', 'eggs'],
    ['bread', 'eggs', 'butter']
]

# Encode the data into a one-hot encoded format
te = TransactionEncoder()
te_data = te.fit(data).transform(data)
df = pd.DataFrame(te_data, columns=te.columns_)

# Find frequent itemsets. mlxtend does not ship an ECLAT
# implementation; apriori produces the same frequent itemsets
# (ECLAT differs only in how it searches, via vertical tid-lists)
frequent_itemsets = apriori(df, min_support=0.5, use_colnames=True)

# Generate association rules from the frequent itemsets
rules = association_rules(frequent_itemsets, metric="lift", min_threshold=1)

# Print the results
print("Frequent itemsets:")
print(frequent_itemsets)
print("\nAssociation rules:")
print(rules)
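
The rules table can be filtered on any of its metric columns; for example, keeping only high-confidence rules (column names are those produced by mlxtend's association_rules):

# Keep rules with confidence >= 0.8 and show the key columns
strong_rules = rules[rules['confidence'] >= 0.8]
print(strong_rules[['antecedents', 'consequents', 'support', 'confidence', 'lift']])
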
import pandas as pd
from mlxtend.frequent_patterns import apriori
from mlxtend.preprocessing import TransactionEncoder

# Sample dataset
data = [
    ['milk', 'bread', 'eggs'],
    ['bread', 'butter'],
    ['milk', 'bread', 'butter'],
    ['milk', 'eggs'],
    ['bread', 'eggs', 'butter']
]

# Encode the data into a one-hot encoded format
te = TransactionEncoder()
te_data = te.fit(data).transform(data)
df = pd.DataFrame(te_data, columns=te.columns_)

# Find frequent itemsets (apriori again, as mlxtend has no ECLAT)
frequent_itemsets = apriori(df, min_support=0.5, use_colnames=True)

# The 'itemsets' column holds frozensets, so '<' tests proper subset
itemsets = list(frequent_itemsets['itemsets'])
support = dict(zip(frequent_itemsets['itemsets'], frequent_itemsets['support']))

# Closed frequent itemsets: no frequent proper superset has the same support
closed_itemsets = frequent_itemsets[frequent_itemsets['itemsets'].apply(
    lambda s: not any(s < t and support[t] == support[s] for t in itemsets))]

# Maximal frequent itemsets: no proper superset is frequent
maximal_itemsets = frequent_itemsets[frequent_itemsets['itemsets'].apply(
    lambda s: not any(s < t for t in itemsets))]

# Minimal frequent itemsets: no proper subset is frequent
# (for frequent itemsets these are exactly the single items)
minimal_itemsets = frequent_itemsets[frequent_itemsets['itemsets'].apply(
    lambda s: not any(t < s for t in itemsets))]

# Print the results
print("Frequent itemsets:")
print(frequent_itemsets)
print("\nClosed itemsets:")
print(closed_itemsets)
print("\nMaximal itemsets:")
print(maximal_itemsets)
print("\nMinimal itemsets:")
print(minimal_itemsets)
D-Eclat

import pandas as pd
from mlxtend.frequent_patterns import apriori
from mlxtend.preprocessing import TransactionEncoder

# Create a sample dataset (replace with your own data)
data = [
    ['milk', 'bread', 'eggs'],
    ['bread', 'butter'],
    ['milk', 'bread', 'butter'],
    ['milk', 'eggs'],
    ['bread', 'eggs', 'butter'],
    ['milk', 'bread', 'cheese'],
    ['bread', 'butter', 'yogurt'],
    ['milk', 'bread', 'butter', 'jam'],
    ['milk', 'eggs', 'cheese'],
    ['bread', 'eggs', 'butter', 'honey']
]

# Encode the data into a one-hot encoded format
te = TransactionEncoder()
te_data = te.fit(data).transform(data)
df = pd.DataFrame(te_data, columns=te.columns_)

# mlxtend does not implement dEclat. dEclat returns the same
# frequent itemsets as ECLAT/apriori; it only stores "diffsets"
# (differences of transaction-id lists) instead of tid-lists to
# save memory on dense data. So apriori gives the same result:
frequent_itemsets = apriori(df, min_support=0.5, use_colnames=True)

# Print the results
print("Frequent itemsets:")
print(frequent_itemsets)
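
For reference, the core dEclat idea can be shown directly: every item has a tidset (the ids of the transactions containing it), a candidate's diffset is the tids that drop out of the prefix's tidset when the new item is added, and support(PX) = support(P) - |diffset(PX)|. A minimal hand-rolled sketch for 2-itemsets, reusing the data list above:

from itertools import combinations

# Build a tidset (set of transaction ids) for every item
tidsets = {}
for tid, transaction in enumerate(data):
    for item in transaction:
        tidsets.setdefault(item, set()).add(tid)

min_support_count = 5  # 0.5 support over the 10 transactions

# For a pair (a, b): diffset = tidset(a) - tidset(b), and
# support(a, b) = support(a) - |diffset|
for a, b in combinations(sorted(tidsets), 2):
    diffset = tidsets[a] - tidsets[b]
    support_ab = len(tidsets[a]) - len(diffset)
    if support_ab >= min_support_count:
        print(f"{{{a}, {b}}}: support count = {support_ab}")
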
Apriori Algorithm

import pandas as pd
from mlxtend.frequent_patterns import apriori
from mlxtend.preprocessing import TransactionEncoder

# Sample transaction data as a dictionary
transaction_data = {
    1: ['milk', 'bread', 'eggs'],
    2: ['bread', 'butter'],
    3: ['milk', 'bread', 'butter'],
    4: ['milk', 'eggs'],
    5: ['bread', 'eggs', 'butter']
}

# Convert the dictionary to a list of lists
data = list(transaction_data.values())

# Encode the data into a one-hot encoded format
te = TransactionEncoder()
te_data = te.fit(data).transform(data)
df = pd.DataFrame(te_data, columns=te.columns_)

# Apply the Apriori algorithm to find frequent itemsets
frequent_itemsets = apriori(df, min_support=0.5, use_colnames=True)

# Print the results
print("Frequent itemsets:")
print(frequent_itemsets)
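
With five transactions, min_support=0.5 keeps only itemsets that appear in at least three of them. If only itemsets up to a certain size are needed, apriori can prune the search with its max_len parameter; a small usage sketch:

# Restrict the search to itemsets with at most 2 items
small_itemsets = apriori(df, min_support=0.5, use_colnames=True, max_len=2)
print(small_itemsets)
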
FP Growth

import pandas as pd
from mlxtend.frequent_patterns import fpgrowth
from mlxtend.preprocessing import TransactionEncoder

# Sample dataset
data = [
    ['milk', 'bread', 'eggs'],
    ['bread', 'butter'],
    ['milk', 'bread', 'butter'],
    ['milk', 'eggs'],
    ['bread', 'eggs', 'butter']
]

# Encode the data into a one-hot encoded format
te = TransactionEncoder()
te_data = te.fit(data).transform(data)
df = pd.DataFrame(te_data, columns=te.columns_)

# Apply the FP-growth algorithm to find frequent itemsets.
# mlxtend builds the FP-tree internally and returns only the
# itemsets DataFrame; there is no return_tree option, so the
# tree itself cannot be visualized through this API.
frequent_itemsets = fpgrowth(df, min_support=0.5, use_colnames=True)

# Print the results
print("Frequent itemsets:")
print(frequent_itemsets)
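
FP-growth mines exactly the same frequent itemsets as Apriori; it is just usually faster on large data because it compresses the transactions into the FP-tree instead of generating candidates. That equivalence is easy to sanity-check on the df above:

from mlxtend.frequent_patterns import apriori

# Both algorithms should return the same set of frequent itemsets
ap = apriori(df, min_support=0.5, use_colnames=True)
fp = fpgrowth(df, min_support=0.5, use_colnames=True)
print(set(ap['itemsets']) == set(fp['itemsets']))  # expected: True
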
Naive Bayes
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score

# Load your dataset (replace 'your_dataset.csv' with your actual file)
data = pd.read_csv('your_dataset.csv')

# Separate features and target variable (replace 'target_column'
# with your actual target column name)
X = data.drop('target_column', axis=1)
y = data['target_column']

# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Create a Naive Bayes classifier
nb = GaussianNB()

# Fit the classifier to the training data
nb.fit(X_train, y_train)

# Make predictions on the testing data
y_pred = nb.predict(X_test)

# Calculate accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)

# Assign predicted labels back to the test rows of the original data
# (y_pred has one prediction per test row, so index by X_test)
data.loc[X_test.index, 'predicted_label'] = y_pred

# Print the data with its predicted labels
print(data)
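
Accuracy from a single train/test split can be noisy on small datasets; k-fold cross-validation gives a steadier estimate. A minimal sketch, reusing X and y from above:

from sklearn.model_selection import cross_val_score

# 5-fold cross-validation: fit and score on 5 different splits
scores = cross_val_score(GaussianNB(), X, y, cv=5)
print("CV accuracy: %.3f +/- %.3f" % (scores.mean(), scores.std()))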
