DATA CLEANING AND PREPROCESSING:
import numpy as np
import pandas as pd

# Load the dataset
dataset = pd.read_csv("D:/book1.csv", delimiter=',')
print(dataset)

# Summary of columns, non-null counts and dtypes
dataset.info()

# Check for missing values and drop any rows that contain them
dataset.isna()
dataset_1 = dataset.dropna()
print(dataset_1)

# Split into features (COUNTRY, AGE, SALARY) and target (PURCHASED)
x = dataset.iloc[:, [0, 1, 2]]
y = dataset.iloc[:, [3]]
print(x)
print(y)

# Encode the categorical COUNTRY column as integers
from sklearn.preprocessing import LabelEncoder
lEncoder = LabelEncoder()
x.iloc[:, 0] = lEncoder.fit_transform(x.iloc[:, 0])
print(x)
OUTPUT:
COUNTRY AGE SALARY PURCHASED
0 France 44 72000 no
1 Spain 27 48000 yes
2 Germany 30 64000 no
3 Spain 38 61000 no
4 Germany 40 Nan yes
5 France 38 54000 yes
6 Spain Nan 62000 no
7 France 48 74000 yes
8 Germany 50 83000 no
9 France 37 67000 yes
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 10 entries, 0 to 9
Data columns (total 4 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 COUNTRY 10 non-null object
1 AGE 10 non-null object
2 SALARY 10 non-null object
3 PURCHASED 10 non-null object
dtypes: object(4)
memory usage: 452.0+ bytes
COUNTRY AGE SALARY PURCHASED
0 France 44 72000 no
1 Spain 27 48000 yes
2 Germany 30 64000 no
3 Spain 38 61000 no
4 Germany 40 Nan yes
5 France 38 54000 yes
6 Spain Nan 62000 no
7 France 48 74000 yes
8 Germany 50 83000 no
9 France 37 67000 yes
COUNTRY AGE SALARY
0 France 44 72000
1 Spain 27 48000
2 Germany 30 64000
3 Spain 38 61000
4 Germany 40 Nan
5 France 38 54000
6 Spain Nan 62000
7 France 48 74000
8 Germany 50 83000
9 France 37 67000
PURCHASED
0 no
1 yes
2 no
3 no
4 yes
5 yes
6 no
7 yes
8 no
9 yes
COUNTRY AGE SALARY
0 0 44 72000
1 2 27 48000
2 1 30 64000
3 2 38 61000
4 1 40 Nan
5 0 38 54000
6 2 Nan 62000
7 0 48 74000
8 1 50 83000
9 0 37 67000
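Note in the output above that dropna() leaves the two 'Nan' rows in place: 'Nan' was read from the CSV as a plain string, which is why every column shows as object dtype in info(). The following is a minimal sketch, assuming the same file path and column names, of one way to handle this: convert AGE and SALARY to numeric (turning 'Nan' into real NaN) and then fill the gaps with the column mean.
import pandas as pd
from sklearn.impute import SimpleImputer

dataset = pd.read_csv("D:/book1.csv", delimiter=',')

# Coerce the string 'Nan' entries into real NaN values
dataset[['AGE', 'SALARY']] = dataset[['AGE', 'SALARY']].apply(pd.to_numeric, errors='coerce')

# Replace the missing AGE/SALARY values with the column mean
imputer = SimpleImputer(strategy='mean')
dataset[['AGE', 'SALARY']] = imputer.fit_transform(dataset[['AGE', 'SALARY']])
print(dataset)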
Data from database:
import mysql.connector

# Create the connection object
myconn = mysql.connector.connect(host="localhost", user="root", passwd="", database="SampleDB")

# Create the cursor object
cur = myconn.cursor()

# Execute the query
cur.execute("select * from students")

# Fetch all rows from the cursor object
result = cur.fetchall()

print("Student Details are :")
# Print the result row by row
for x in result:
    print(x)

# Commit the transaction
myconn.commit()

# Close the connection
myconn.close()
Output:
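As a small extension, the fetched rows can be loaded into a pandas DataFrame so the cleaning steps from the first exercise apply to database data as well. This is a minimal sketch, assuming the same students table in SampleDB and the same placeholder credentials; cursor.description is used to recover the column names.
import mysql.connector
import pandas as pd

# Connect exactly as above (credentials are placeholders)
myconn = mysql.connector.connect(host="localhost", user="root", passwd="", database="SampleDB")
cur = myconn.cursor()

# Run the same query and turn the result into a DataFrame;
# cursor.description holds one tuple per column, whose first field is the column name
cur.execute("select * from students")
rows = cur.fetchall()
columns = [desc[0] for desc in cur.description]
students_df = pd.DataFrame(rows, columns=columns)

print(students_df.head())
myconn.close()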
K-means clustering:
from sklearn.cluster import KMeans
import matplotlib.pyplot as plt

# Sample two-dimensional data
x = [4, 5, 10, 4, 3, 11, 14, 6, 10, 12]
y = [21, 19, 24, 17, 16, 25, 24, 22, 21, 21]
#plt.scatter(x, y)
data = list(zip(x, y))

# Compute the inertia (within-cluster sum of squares) for k = 1..10
inertias = []
for i in range(1, 11):
    kmeans = KMeans(n_clusters=i)
    kmeans.fit(data)
    inertias.append(kmeans.inertia_)

# Plot inertia against k to locate the elbow
plt.plot(range(1, 11), inertias, marker='o')
plt.title('Elbow method')
plt.xlabel('Number of clusters')
plt.ylabel('Inertia')
plt.show()
Output:
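Once the elbow plot suggests a value of k (for this data the curve flattens around k = 2), the final model can be fitted and the cluster assignments visualised. This is a minimal sketch reusing the same x, y and data lists as the program above; k = 2 is an assumption read off the elbow plot.
from sklearn.cluster import KMeans
import matplotlib.pyplot as plt

x = [4, 5, 10, 4, 3, 11, 14, 6, 10, 12]
y = [21, 19, 24, 17, 16, 25, 24, 22, 21, 21]
data = list(zip(x, y))

# Fit K-means with the k chosen from the elbow plot (assumed to be 2 here)
kmeans = KMeans(n_clusters=2)
kmeans.fit(data)

# Colour each point by its assigned cluster label
plt.scatter(x, y, c=kmeans.labels_)
plt.title('K-means clusters (k=2)')
plt.show()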
K-nearest neighbours:
# Import necessary modules
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import train_test_split
from sklearn.datasets import load_iris
import random

# Loading data
data_iris = load_iris()

# To get the list of target names
label_target = data_iris.target_names

print()
print("Sample Data from Iris Dataset")
print("*" * 30)

# Display ten random samples from the iris dataset
for i in range(10):
    rn = random.randint(0, 120)
    print(data_iris.data[rn], "===>", label_target[data_iris.target[rn]])

# Create feature and target arrays
X = data_iris.data
y = data_iris.target

# Split into training and test sets
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=1)
print("The Training dataset length: ", len(X_train))
print("The Testing dataset length: ", len(X_test))

try:
    nn = int(input("Enter number of neighbors :"))
    knn = KNeighborsClassifier(n_neighbors=nn)
    knn.fit(X_train, y_train)
    # Display the accuracy on the test set
    print("The Score is :", knn.score(X_test, y_test))
    # Get test data from the user
    test_data = input("Enter Test Data :").split(",")
    for i in range(len(test_data)):
        test_data[i] = float(test_data[i])
    print()
    v = knn.predict([test_data])
    print("Predicted output is :", label_target[v])
except ValueError:
    print("Please supply valid input......")
Output:
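Beyond the single accuracy score, the fitted classifier can be evaluated with a confusion matrix and a per-class report. This is a minimal sketch that rebuilds the same train/test split (test_size=0.3, random_state=1); n_neighbors=3 is only an illustrative choice, not a value fixed by the program above.
from sklearn.neighbors import KNeighborsClassifier
from sklearn.model_selection import train_test_split
from sklearn.datasets import load_iris
from sklearn.metrics import confusion_matrix, classification_report

data_iris = load_iris()
X_train, X_test, y_train, y_test = train_test_split(
    data_iris.data, data_iris.target, test_size=0.3, random_state=1)

# n_neighbors=3 is an assumed value for illustration
knn = KNeighborsClassifier(n_neighbors=3)
knn.fit(X_train, y_train)
y_pred = knn.predict(X_test)

print(confusion_matrix(y_test, y_pred))
print(classification_report(y_test, y_pred, target_names=data_iris.target_names))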
Linear regression:
import numpy as np
import matplotlib.pyplot as plt

def estimate_coef(x, y):
    # number of observations/points
    n = np.size(x)
    # mean of x and y vectors
    m_x = np.mean(x)
    m_y = np.mean(y)
    # calculating cross-deviation and deviation about x
    SS_xy = np.sum(y*x) - n*m_y*m_x
    SS_xx = np.sum(x*x) - n*m_x*m_x
    # calculating regression coefficients
    b_1 = SS_xy / SS_xx
    b_0 = m_y - b_1*m_x
    return (b_0, b_1)

def plot_regression_line(x, y, b):
    # plotting the actual points as a scatter plot
    plt.scatter(x, y, color="m", marker="o", s=30)
    # predicted response vector
    y_pred = b[0] + b[1]*x
    # plotting the regression line
    plt.plot(x, y_pred, color="g")
    # putting labels
    plt.xlabel('x')
    plt.ylabel('y')
    # show the plot
    plt.show()

def main():
    # observations / data
    x = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])
    y = np.array([1, 3, 2, 5, 7, 8, 8, 9, 10, 12])
    # estimating coefficients
    b = estimate_coef(x, y)
    print("Estimated coefficients:\nb_0 = {}\nb_1 = {}".format(b[0], b[1]))
    # plotting the regression line
    plot_regression_line(x, y, b)

if __name__ == "__main__":
    main()
Output:
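The closed-form coefficients computed by estimate_coef can be cross-checked against scikit-learn's LinearRegression on the same ten points. This is a minimal sketch, assuming the same x and y arrays; it is not part of the original program.
import numpy as np
from sklearn.linear_model import LinearRegression

x = np.array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9]).reshape(-1, 1)
y = np.array([1, 3, 2, 5, 7, 8, 8, 9, 10, 12])

# Fit and report the intercept (b_0) and slope (b_1); these should match estimate_coef
model = LinearRegression().fit(x, y)
print("b_0 =", model.intercept_)
print("b_1 =", model.coef_[0])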
SVM program:
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import make_blobs

# Generate two linearly separable blobs
x, y = make_blobs(n_samples=500, centers=2, random_state=0, cluster_std=0.40)
xfit = np.linspace(-1, 3.5)

plt.scatter(x[:, 0], x[:, 1], c=y, s=50, cmap='spring')

# Draw three candidate separating lines together with their margins
for m, b, d in [(1, 0.65, 0.33), (0.5, 1.6, 0.55), (-0.2, 2.9, 0.2)]:
    yfit = m*xfit + b
    plt.plot(xfit, yfit, '-k')
    plt.fill_between(xfit, yfit - d, yfit + d, edgecolor='none', color='#AAAAAA', alpha=0.4)

plt.xlim(-1, 3.5)
plt.show()
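The lines above are hand-picked separators; the actual maximum-margin line can be obtained by fitting a linear SVM on the same blobs. This is a minimal sketch, assuming a large C to approximate a hard margin, and it highlights the support vectors the classifier selects.
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import make_blobs
from sklearn.svm import SVC

# Same data as above
x, y = make_blobs(n_samples=500, centers=2, random_state=0, cluster_std=0.40)

# Fit a linear SVM; a large C approximates a hard margin
model = SVC(kernel='linear', C=1e10)
model.fit(x, y)

# Plot the points and circle the support vectors
plt.scatter(x[:, 0], x[:, 1], c=y, s=50, cmap='spring')
plt.scatter(model.support_vectors_[:, 0], model.support_vectors_[:, 1],
            s=200, facecolors='none', edgecolors='k')

# Draw the decision boundary w.x + b = 0 from the fitted coefficients
w = model.coef_[0]
b = model.intercept_[0]
xfit = np.linspace(-1, 3.5)
plt.plot(xfit, -(w[0]*xfit + b) / w[1], '-k')
plt.xlim(-1, 3.5)
plt.show()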