Week 1
Week 1
Week 1
ipynb - Colab
import pandas as pd
# Load the raw marks workbook; the path is relative to the notebook's working directory.
df = pd.read_excel(io='student_marks.xlsx')
def pass_fail_status(row, pass_mark=50):
    """Classify one student row as "Pass" or "Fail".

    The first two positions of ``row`` are skipped and every remaining
    value is treated as a mark. (Presumably the skipped positions are the
    "Name" and "Roll Number" columns -- confirm against the spreadsheet
    layout.)

    Args:
        row: A pandas Series holding one student's record, as supplied by
            ``DataFrame.apply(..., axis=1)``.
        pass_mark: Minimum mark required in every subject. Defaults to 50,
            the threshold that was previously hard-coded.

    Returns:
        "Fail" if any mark is below ``pass_mark``, otherwise "Pass".
    """
    # .iloc makes the positional slice explicit instead of relying on how
    # plain [] indexing interprets integers on a label-indexed Series.
    marks = row.iloc[2:]
    return "Fail" if any(mark < pass_mark for mark in marks) else "Pass"
# Label every student by applying the pass/fail rule row by row.
status_per_student = df.apply(pass_fail_status, axis=1)
df["Status"] = status_per_student

# Compact view with just the identifying columns and the verdict.
summary_columns = ["Name", "Roll Number", "Status"]
df_status = df[summary_columns]
print(df_status)

# Persist the full table (marks plus Status) without the index column,
# then echo it for inspection.
df.to_excel('Updated_Students_Data.xlsx', index=False)
print(df)
https://colab.research.google.com/drive/17u1rJx_8k-YiRyWTtd_gGHOKBQDkg-NA#scrollTo=AYBgC6SB7V6v&printMode=true 1/4
8/19/24, 2:15 PM 12 Aug(1st & 2nd Labs Combined).ipynb - Colab
23 Student 24 24 35 70 55 75
24 Student 25 25 31 49 49 61
25 Student 26 26 42 70 36 50
26 Student 27 27 70 70 74 34
27 Student 28 28 41 47 75 60
28 Student 29 29 44 74 49 78
29 Student 30 30 34 76 69 41
30 Student 31 31 53 60 79 71
31 Student 32 32 77 54 67 55
32 Student 33 33 60 62 64 68
33 Student 34 34 68 75 53 46
34 Student 35 35 61 76 42 66
35 Student 36 36 64 51 68 39
36 Student 37 37 65 46 79 39
37 Student 38 38 38 46 33 66
38 Student 39 39 78 53 40 67
39 Student 40 40 77 44 68 50
40 Student 41 41 43 50 54 41
41 Student 42 42 60 46 60 36
42 Student 43 43 78 35 76 62
43 Student 44 44 40 57 53 64
44 Student 45 45 31 45 46 54
45 Student 46 46 47 63 58 30
46 Student 47 47 65 79 71 44
47 Student 48 48 51 75 33 37
48 Student 49 49 46 33 37 57
49 Student 50 50 67 49 75 68
# Reload the labelled workbook and turn it into a numeric feature matrix
# plus an encoded target vector.
data_file = 'Updated_Students_Data.xlsx'
student_data = pd.read_excel(data_file)

# Everything except "Status" is a predictor; "Status" is the target.
features = student_data.drop(columns=['Status'])
labels = student_data['Status']

# NOTE(review): LabelEncoder and StandardScaler are not imported in the
# visible cells -- presumably `from sklearn.preprocessing import
# LabelEncoder, StandardScaler` ran in an earlier cell; confirm.

# Give each text column its own encoder. Re-fitting one shared encoder
# would overwrite the previous column's mapping, so the encoded values
# could no longer be inverse-transformed afterwards.
feature_encoders = {}
for column in features.select_dtypes(include='object').columns:
    feature_encoders[column] = LabelEncoder()
    features[column] = feature_encoders[column].fit_transform(features[column])

# `label_encoder` ends up fitted on the target only, as before.
label_encoder = LabelEncoder()
labels = label_encoder.fit_transform(labels)

# Standardise the features. (The original line had a stray trailing "1"
# after the constructor call, which is a syntax error.)
# NOTE(review): if a train/test split follows, fitting the scaler on all
# rows lets test-set statistics leak into training -- consider fitting on
# the training portion only.
scaler = StandardScaler()
features_scaled = scaler.fit_transform(features)
KNN
from sklearn.neighbors import KNeighborsClassifier
# Hyper-parameter grid explored for the k-nearest-neighbours classifier.
knn_params = dict(
    n_neighbors=[3, 5, 7],
    weights=['uniform', 'distance'],
    p=[1, 2],  # 1 for Manhattan, 2 for Euclidean
)

# Cross-validated (cv=5) search over the grid, fitted on the training split.
knn_grid_search = GridSearchCV(
    estimator=KNeighborsClassifier(),
    param_grid=knn_params,
    cv=5,
)
knn_grid_search.fit(X_train, y_train)

# Take the best estimator found by the search and predict the test split.
knn_best_model = knn_grid_search.best_estimator_
knn_predictions = knn_best_model.predict(X_test)
# Show how many students fall into each Status class.
status_counts = student_data['Status'].value_counts()
print(status_counts)
Status
Fail 46
Pass 4
Name: count, dtype: int64
https://colab.research.google.com/drive/17u1rJx_8k-YiRyWTtd_gGHOKBQDkg-NA#scrollTo=AYBgC6SB7V6v&printMode=true 3/4
8/19/24, 2:15 PM 12 Aug(1st & 2nd Labs Combined).ipynb - Colab
https://colab.research.google.com/drive/17u1rJx_8k-YiRyWTtd_gGHOKBQDkg-NA#scrollTo=AYBgC6SB7V6v&printMode=true 4/4