ML ASSIGNMENT 1
Shivam Sanjay Kasodekar
123B1D024
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Load the heart-disease CSV into a DataFrame.
# NOTE(review): the absolute /content/... path presumably only resolves inside
# a Colab session -- confirm before running elsewhere.
df = pd.read_csv('/content/heart_cleveland_upload.csv')
# Preview the first rows to check that the columns parsed as expected.
df.head()
{"summary":"{\n \"name\": \"df\",\n \"rows\": 297,\n \"fields\": [\
n {\n \"column\": \"age\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 9,\n \"min\": 29,\n
\"max\": 77,\n \"num_unique_values\": 41,\n \"samples\":
[\n 50,\n 42,\n 58\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 0,\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"cp\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 3,\n \"num_unique_values\": 4,\n \"samples\":
[\n 1,\n 3\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 17,\n \"min\": 94,\n
\"max\": 200,\n \"num_unique_values\": 50,\n
\"samples\": [\n 148,\n 144\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"chol\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 51,\n \"min\": 126,\n
\"max\": 564,\n \"num_unique_values\": 152,\n
\"samples\": [\n 360,\n 341\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 0,\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 2,\n \"num_unique_values\": 3,\n \"samples\":
[\n 2,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"thalach\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 22,\n \"min\": 71,\n
\"max\": 202,\n \"num_unique_values\": 91,\n
\"samples\": [\n 170,\n 164\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"exang\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": 0,\n \"min\":
0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1,\n 0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
1.1661227818468956,\n \"min\": 0.0,\n \"max\": 6.2,\n
\"num_unique_values\": 40,\n \"samples\": [\n 0.7,\n
0.3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 1,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 2,\n
3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 0,\n
2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"condition\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"df"}
# Draw a single row at random as a spot check of the raw values.
df.sample()
{"summary":"{\n \"name\": \"df\",\n \"rows\": 1,\n \"fields\": [\n
{\n \"column\": \"age\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\": 61,\n
\"max\": 61,\n \"num_unique_values\": 1,\n \"samples\":
[\n 61\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"cp\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\": 3,\n
\"max\": 3,\n \"num_unique_values\": 1,\n \"samples\":
[\n 3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 130,\n
\"max\": 130,\n \"num_unique_values\": 1,\n \"samples\":
[\n 130\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 330,\n \"max\": 330,\n
\"num_unique_values\": 1,\n \"samples\": [\n 330\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"fbs\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": 0,\n \"max\": 0,\n \"num_unique_values\": 1,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 2,\n
\"max\": 2,\n \"num_unique_values\": 1,\n \"samples\":
[\n 2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thalach\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": 169,\n \"max\": 169,\
n \"num_unique_values\": 1,\n \"samples\": [\n
169\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"oldpeak\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": 0.0,\n \"max\": 0.0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0.0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"slope\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": 0,\n \"max\": 0,\n \"num_unique_values\": 1,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"ca\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 0,\n
\"max\": 0,\n \"num_unique_values\": 1,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": 1,\n \"max\": 1,\n
\"num_unique_values\": 1,\n \"samples\": [\n 1\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n }\n ]\n}","type":"dataframe"}
# Count the missing (null) entries in each column.
df.isnull().sum()
age 0
sex 0
cp 0
trestbps 0
chol 0
fbs 0
restecg 0
thalach 0
exang 0
oldpeak 0
slope 0
ca 0
thal 0
condition 0
dtype: int64
# Summary statistics (count, mean, std, min, quartiles, max) per numeric column.
df.describe()
{"summary":"{\n \"name\": \"df\",\n \"rows\": 8,\n \"fields\": [\n
{\n \"column\": \"age\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 90.50115084828495,\n
\"min\": 9.049735681096765,\n \"max\": 297.0,\n
\"num_unique_values\": 8,\n \"samples\": [\n
54.54208754208754,\n 56.0,\n 297.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 104.79682279715288,\n
\"min\": 0.0,\n \"max\": 297.0,\n \"num_unique_values\":
5,\n \"samples\": [\n 0.6767676767676768,\n
1.0,\n 0.468499967441002\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"cp\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 104.34732263291957,\n
\"min\": 0.0,\n \"max\": 297.0,\n \"num_unique_values\":
6,\n \"samples\": [\n 297.0,\n
2.1582491582491583,\n 3.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
80.94289052189558,\n \"min\": 17.762806366599,\n
\"max\": 297.0,\n \"num_unique_values\": 8,\n
\"samples\": [\n 131.69360269360268,\n 130.0,\n
297.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 150.05026434490236,\n \"min\": 51.99758253513897,\n
\"max\": 564.0,\n \"num_unique_values\": 8,\n
\"samples\": [\n 247.35016835016836,\n 243.0,\n
297.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"fbs\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 104.93029576699878,\n \"min\": 0.0,\n \"max\":
297.0,\n \"num_unique_values\": 5,\n \"samples\": [\n
0.1447811447811448,\n 1.0,\n 0.35247393412545347\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"restecg\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
104.6549606800254,\n \"min\": 0.0,\n \"max\": 297.0,\n
\"num_unique_values\": 6,\n \"samples\": [\n 297.0,\n
0.9966329966329966,\n 2.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
82.15688994105308,\n \"min\": 22.941562061360813,\n
\"max\": 297.0,\n \"num_unique_values\": 8,\n
\"samples\": [\n 149.5993265993266,\n 153.0,\n
297.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 104.86494385520157,\n \"min\": 0.0,\n \"max\":
297.0,\n \"num_unique_values\": 5,\n \"samples\": [\n
0.3265993265993266,\n 1.0,\n 0.46976081219618576\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"oldpeak\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
104.47750327433197,\n \"min\": 0.0,\n \"max\": 297.0,\n
\"num_unique_values\": 7,\n \"samples\": [\n 297.0,\n
1.0555555555555556,\n 1.6\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"slope\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": 104.74360725657165,\
n \"min\": 0.0,\n \"max\": 297.0,\n
\"num_unique_values\": 6,\n \"samples\": [\n 297.0,\n
0.6026936026936027,\n 2.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 104.72638124231159,\n
\"min\": 0.0,\n \"max\": 297.0,\n \"num_unique_values\":
6,\n \"samples\": [\n 297.0,\n
0.6767676767676768,\n 3.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thal\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 104.71611983772739,\n
\"min\": 0.0,\n \"max\": 297.0,\n \"num_unique_values\":
5,\n \"samples\": [\n 0.835016835016835,\n
2.0,\n 0.9566902138394462\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
104.85664736713339,\n \"min\": 0.0,\n \"max\": 297.0,\n
\"num_unique_values\": 5,\n \"samples\": [\n
0.4612794612794613,\n 1.0,\n 0.49933981349402623\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n }\n ]\n}","type":"dataframe"}
# Age against cholesterol, with points coloured by the `condition` column.
# seaborn returns the Axes it drew on, so the labels are set on that object
# rather than through the implicit pyplot "current axes".
ax = sns.scatterplot(data=df, x='age', y='chol', hue='condition')
ax.set_title('Scatter Plot of Age vs Cholesterol by Heart Condition')
ax.set_xlabel('Age')
ax.set_ylabel('Cholesterol')
ax.legend(title='Condition')
plt.show()
# Maximum heart rate (thalach) plotted against the `condition` column.
# NOTE(review): `condition` takes only two values in the recorded summaries, so
# the points stack in two vertical lines; a box or strip plot may read better.
ax = sns.scatterplot(data=df, x='condition', y='thalach')
ax.set(
    title='Scatter Plot of Heart Condition vs Max Heart Rate',
    xlabel='Heart Condition (0 = No Disease)',
    ylabel='Maximum Heart Rate (thalach)',
)
plt.show()
# IQR-based outlier scan: for every numeric column, show the rows whose value
# lies more than 1.5 * IQR below the first quartile or above the third.
# NOTE(review): columns holding only a few coded values (e.g. fbs, cp) get an
# entire category flagged by this rule; treat those tables with caution.
numerical_cols = df.select_dtypes(include=['number']).columns
for col in numerical_cols:
    # Fetch both quartiles in one call; unpacking yields the 25% and 75%
    # values in that order.
    Q1, Q3 = df[col].quantile([0.25, 0.75])
    IQR = Q3 - Q1
    lower_bound = Q1 - 1.5 * IQR
    upper_bound = Q3 + 1.5 * IQR

    # Rows falling outside either fence for the current column.
    too_low = df[col] < lower_bound
    too_high = df[col] > upper_bound
    outliers = df[too_low | too_high]

    print(f"Outliers in '{col}':")
    display(outliers)
Outliers in 'age':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'sex':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'cp':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 23,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
10,\n \"min\": 34,\n \"max\": 69,\n
\"num_unique_values\": 17,\n \"samples\": [\n 69,\n
66,\n 61\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"trestbps\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
19,\n \"min\": 110,\n \"max\": 178,\n
\"num_unique_values\": 14,\n \"samples\": [\n 120\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"chol\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 33,\n
\"min\": 182,\n \"max\": 298,\n \"num_unique_values\":
22,\n \"samples\": [\n 234\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thalach\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
20,\n \"min\": 114,\n \"max\": 190,\n
\"num_unique_values\": 16,\n \"samples\": [\n 131\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"exang\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"oldpeak\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 1.1425303033491698,\n \"min\":
0.0,\n \"max\": 4.2,\n \"num_unique_values\": 15,\n
\"samples\": [\n 0.0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"slope\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 2,\n \"num_unique_values\": 3,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 1\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thal\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 3,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"condition\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'trestbps':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 9,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
5,\n \"min\": 52,\n \"max\": 68,\n
\"num_unique_values\": 8,\n \"samples\": [\n 54,\n
64,\n 59\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 1,\n
3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 8,\n \"min\": 172,\n
\"max\": 200,\n \"num_unique_values\": 6,\n \"samples\":
[\n 178,\n 192\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"chol\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 41,\n \"min\": 199,\n
\"max\": 327,\n \"num_unique_values\": 9,\n \"samples\":
[\n 288,\n 283\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 1,\n \"min\": 0,\n
\"max\": 2,\n \"num_unique_values\": 3,\n \"samples\":
[\n 2,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"thalach\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 21,\n \"min\": 117,\n
\"max\": 195,\n \"num_unique_values\": 9,\n \"samples\":
[\n 133,\n 195\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"exang\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": 0,\n \"min\":
0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1,\n 0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
1.7677669529663687,\n \"min\": 0.0,\n \"max\": 4.2,\n
\"num_unique_values\": 7,\n \"samples\": [\n 4.2,\n
0.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 2,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"condition\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'chol':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 5,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
4,\n \"min\": 56,\n \"max\": 67,\n
\"num_unique_values\": 5,\n \"samples\": [\n 65,\n
56,\n 63\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"cp\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 2,\n
\"max\": 3,\n \"num_unique_values\": 2,\n \"samples\":
[\n 3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 12,\n \"min\": 115,\n
\"max\": 150,\n \"num_unique_values\": 4,\n \"samples\":
[\n 140\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 70,\n \"min\": 394,\n \"max\": 564,\n
\"num_unique_values\": 5,\n \"samples\": [\n 417\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"fbs\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": 0,\n \"min\":
0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 2,\n
\"max\": 2,\n \"num_unique_values\": 1,\n \"samples\":
[\n 2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thalach\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 3,\n \"min\": 150,\n \"max\": 160,\n
\"num_unique_values\": 4,\n \"samples\": [\n 157\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"exang\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"oldpeak\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 1.2449899597988732,\n \"min\":
0.8,\n \"max\": 4.0,\n \"num_unique_values\": 5,\n
\"samples\": [\n 0.8\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"slope\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 1\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thal\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 1,\n
\"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 2,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"condition\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'fbs':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 43,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
6,\n \"min\": 42,\n \"max\": 71,\n
\"num_unique_values\": 22,\n \"samples\": [\n 69,\n
57,\n 71\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 1,\n
3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 20,\n \"min\": 101,\n
\"max\": 200,\n \"num_unique_values\": 27,\n
\"samples\": [\n 101,\n 126\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"chol\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 51,\n \"min\": 126,\n
\"max\": 417,\n \"num_unique_values\": 38,\n
\"samples\": [\n 225,\n 203\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 1,\n
\"max\": 1,\n \"num_unique_values\": 1,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thalach\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
22,\n \"min\": 90,\n \"max\": 194,\n
\"num_unique_values\": 36,\n \"samples\": [\n 136\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"exang\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"oldpeak\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 1.086619515381114,\n \"min\":
0.0,\n \"max\": 4.0,\n \"num_unique_values\": 20,\n
\"samples\": [\n 0.1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"slope\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 2,\n \"num_unique_values\": 3,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thal\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 3,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"condition\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'restecg':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'thalach':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 1,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": 67,\n \"max\": 67,\n
\"num_unique_values\": 1,\n \"samples\": [\n 67\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"sex\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": 1,\n \"max\": 1,\n \"num_unique_values\": 1,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"cp\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 3,\n
\"max\": 3,\n \"num_unique_values\": 1,\n \"samples\":
[\n 3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 120,\n
\"max\": 120,\n \"num_unique_values\": 1,\n \"samples\":
[\n 120\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 237,\n \"max\": 237,\n
\"num_unique_values\": 1,\n \"samples\": [\n 237\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"fbs\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": 0,\n \"max\": 0,\n \"num_unique_values\": 1,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 0,\n
\"max\": 0,\n \"num_unique_values\": 1,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thalach\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": 71,\n \"max\": 71,\n
\"num_unique_values\": 1,\n \"samples\": [\n 71\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"exang\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": 0,\n \"max\": 0,\n \"num_unique_values\": 1,\n
\"samples\": [\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"oldpeak\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": null,\n \"min\": 1.0,\n
\"max\": 1.0,\n \"num_unique_values\": 1,\n \"samples\":
[\n 1.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 1,\n \"max\": 1,\n
\"num_unique_values\": 1,\n \"samples\": [\n 1\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\": 0,\n
\"max\": 0,\n \"num_unique_values\": 1,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": 0,\n \"max\": 0,\n
\"num_unique_values\": 1,\n \"samples\": [\n 0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": 1,\n \"max\": 1,\n
\"num_unique_values\": 1,\n \"samples\": [\n 1\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'exang':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'oldpeak':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 5,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
4,\n \"min\": 51,\n \"max\": 62,\n
\"num_unique_values\": 5,\n \"samples\": [\n 62,\n
51,\n 58\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 2,\n \"samples\": [\n 3,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 24,\n \"min\": 114,\n
\"max\": 178,\n \"num_unique_values\": 4,\n \"samples\":
[\n 160,\n 140\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"chol\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 62,\n \"min\": 164,\n
\"max\": 318,\n \"num_unique_values\": 5,\n \"samples\":
[\n 164,\n 298\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 0,\n \"num_unique_values\": 1,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 1,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 2\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thalach\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
15,\n \"min\": 111,\n \"max\": 145,\n
\"num_unique_values\": 4,\n \"samples\": [\n 140\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"exang\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"oldpeak\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0.923038460737146,\n \"min\":
4.2,\n \"max\": 6.2,\n \"num_unique_values\": 4,\n
\"samples\": [\n 6.2\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"slope\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 1,\n
\"max\": 2,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 1,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 2,\n \"samples\": [\n 3\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thal\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 1,\n \"max\": 2,\n \"num_unique_values\": 2,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"condition\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'slope':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'ca':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 20,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
8,\n \"min\": 45,\n \"max\": 77,\n
\"num_unique_values\": 15,\n \"samples\": [\n 63,\n
57,\n 66\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 1,\n \"max\": 3,\n
\"num_unique_values\": 3,\n \"samples\": [\n 1,\n
2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 16,\n \"min\": 108,\n
\"max\": 165,\n \"num_unique_values\": 13,\n
\"samples\": [\n 108,\n 128\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"chol\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 62,\n \"min\": 149,\n
\"max\": 407,\n \"num_unique_values\": 19,\n
\"samples\": [\n 246,\n 304\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"restecg\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 2,\n \"num_unique_values\": 3,\n \"samples\":
[\n 0,\n 2\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"thalach\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 18,\n \"min\": 106,\n
\"max\": 173,\n \"num_unique_values\": 18,\n
\"samples\": [\n 120,\n 146\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"exang\",\n \"properties\": {\
n \"dtype\": \"number\",\n \"std\": 0,\n \"min\":
0,\n \"max\": 1,\n \"num_unique_values\": 2,\n
\"samples\": [\n 0,\n 1\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
1.7085774322825593,\n \"min\": 0.0,\n \"max\": 6.2,\n
\"num_unique_values\": 14,\n \"samples\": [\n 1.9,\n
2.2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 1,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 3,\n \"max\": 3,\n
\"num_unique_values\": 1,\n \"samples\": [\n 3\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"thal\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 0,\n
\"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 3,\n
\"samples\": [\n 1\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"condition\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'thal':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
Outliers in 'condition':
{"summary":"{\n \"name\": \"outliers\",\n \"rows\": 0,\n
\"fields\": [\n {\n \"column\": \"age\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"sex\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"trestbps\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"fbs\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": null,\n \"min\": null,\n \"max\":
null,\n \"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"thalach\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"oldpeak\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": null,\n
\"min\": null,\n \"max\": null,\n \"num_unique_values\":
0,\n \"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"ca\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": null,\n \"min\":
null,\n \"max\": null,\n \"num_unique_values\": 0,\n
\"samples\": [],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"condition\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
null,\n \"min\": null,\n \"max\": null,\n
\"num_unique_values\": 0,\n \"samples\": [],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n }\n ]\n}","type":"dataframe","variable_name":"outliers"}
from sklearn.preprocessing import LabelEncoder,MinMaxScaler
# Pull the target column out as y; everything else becomes the feature frame X.
y = df["condition"]
X = df.drop(columns="condition")
# Show the raw target values as a plain Python list.
print("Original labels:")
print(y.tolist())
Original labels:
[0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0,
0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1,
0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1,
0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 0, 0, 1, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1,
1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1,
1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
0, 1, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1,
1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1,
0, 0, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0,
0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1]
from sklearn.preprocessing import MinMaxScaler
# Rescale the continuous columns to the [0, 1] range (MinMaxScaler default);
# all other columns in df are left unchanged.
# The column list is named once so the selection and the assignment target
# cannot drift apart, and the assignment fits on a single valid statement.
numeric_cols = ['age', 'trestbps', 'chol', 'thalach', 'oldpeak']
scaler = MinMaxScaler()
# NOTE(review): the scaler is fit on the full dataset. If a train/test split
# happens later, fit on the training portion only to avoid leakage.
# NOTE(review): X built earlier with df.drop(...) is a separate frame and
# presumably still holds the unscaled values -- confirm before using it.
df[numeric_cols] = scaler.fit_transform(df[numeric_cols])
df.head()
{"summary":"{\n \"name\": \"df\",\n \"rows\": 297,\n \"fields\": [\
n {\n \"column\": \"age\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 0.18853616002284923,\n
\"min\": 0.0,\n \"max\": 0.9999999999999999,\n
\"num_unique_values\": 41,\n \"samples\": [\n
0.4374999999999999,\n 0.27083333333333337,\n
0.6041666666666666\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"sex\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"cp\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 1,\n
3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"trestbps\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0.16757364496791516,\n \"min\":
0.0,\n \"max\": 1.0,\n \"num_unique_values\": 50,\n
\"samples\": [\n 0.5094339622641509,\n
0.4716981132075472\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"chol\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0.11871594186104785,\n \"min\": 0.0,\n \"max\":
0.9999999999999998,\n \"num_unique_values\": 152,\n
\"samples\": [\n 0.5342465753424657,\n
0.49086757990867574\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"fbs\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 0,\n
1\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"restecg\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 2,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thalach\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 0.17512642794931907,\n \"min\": 0.0,\n
\"max\": 0.9999999999999999,\n \"num_unique_values\": 91,\n
\"samples\": [\n 0.7557251908396946,\n
0.7099236641221373\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"exang\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 1,\n
\"num_unique_values\": 2,\n \"samples\": [\n 1,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"oldpeak\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 0.18808431965272515,\n \"min\": 0.0,\n
\"max\": 1.0,\n \"num_unique_values\": 40,\n
\"samples\": [\n 0.1129032258064516,\n
0.04838709677419355\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"slope\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 1,\n
0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ca\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 3,\n
\"num_unique_values\": 4,\n \"samples\": [\n 2,\n
3\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"thal\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 0,\n \"min\": 0,\n \"max\": 2,\n
\"num_unique_values\": 3,\n \"samples\": [\n 0,\n
2\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"condition\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 0,\n \"min\": 0,\n
\"max\": 1,\n \"num_unique_values\": 2,\n \"samples\":
[\n 1,\n 0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"df"}
feature selection
from sklearn.feature_selection import SelectKBest, f_classif, chi2
# Score the five numeric columns against the target with f_classif.
# k='all' keeps every column, so this pass does not drop anything.
y = df['condition']
x = df[['age', 'trestbps', 'chol', 'thalach', 'oldpeak']]
selector = SelectKBest(f_classif, k='all')
x_new = selector.fit(x, y).transform(x)
# Boolean mask over x's columns marking the ones the selector retained.
support_mask = selector.get_support()
selected_features = x.columns[support_mask]
print(selected_features)
Index(['age', 'trestbps', 'chol', 'thalach', 'oldpeak'],
dtype='object')
# Keep the two columns of x with the highest chi-squared score against y.
# chi2 requires non-negative inputs; x is taken from the MinMax-scaled columns.
selector = SelectKBest(chi2, k=2)
x_new = selector.fit_transform(x, y)
# Fixed: the result used to be stored under the misspelled name
# `elected_features`, so the print below showed the stale value of
# `selected_features` (all five columns) instead of the two chosen here.
selected_features = x.columns[selector.get_support()]
print(selected_features)
Index(['age', 'trestbps', 'chol', 'thalach', 'oldpeak'],
dtype='object')