import pandas as pd
import matplotlib.pyplot as plt
import sklearn
from sklearn.linear_model import LogisticRegression
import numpy as np
import seaborn as sns
#% matplotlib inline
import math
titanic_data = pd.read_csv("C:\\Users\\OCHIN\\Desktop\\Titanic.csv")
#print(titanic_data.head())
#print(titanic_data.shape)
#print(titanic_data.head(5))
#titanic_data.dropna(inplace=True)
#sns.countplot(x="survived", data=titanic_data)
#sns.countplot(x="survived", hue="male", data=titanic_data)
#sns.countplot(x="survived", hue="pclass", data=titanic_data)
#titanic_data ["age"].plot.hist()
#plt.show()
#titanic_data.info()
# Data Wrangling
#print(titanic_data.isnull())
###Training
y=titanic_data["survived"]
X=titanic_data.drop("survived",axis=1)
from sklearn.model_selection import train_test_split
X_train,X_test,y_train,y_test=train_test_split(X,y,test_size=0.3, random_state=42)
# type: (object, object, object, object)
logmodel = LogisticRegression()
logmodel.fit(X_train,y_train)
predictions=logmodel.predict (X_test)
from sklearn.metrics import confusion_matrix
print(confusion_matrix(y_test,predictions))
from sklearn.metrics import accuracy_score
print(accuracy_score(y_test,predictions))