Evaluate classification models using F1 score.
F1 Score
Evaluation metric for classification algorithms
- F1 score combines precision and recall relative to a specific positive class.
- The F1 score can be interpreted as a weighted average of precision and recall, where an F1 score reaches its best value at 1 and its worst at 0.
- F1 Score Documentation
In [28]:
# FORMULA
# F1 = 2 * (precision * recall) / (precision + recall)
In [8]:
# imports
import pandas as pd
# load the raw dataset into X (features and target are still mixed together here)
# NOTE(review): assumes 'titanic_data.csv' exists in the current working directory — confirm
path = 'titanic_data.csv'
X = pd.read_csv(path)
# peek at the first row to sanity-check the load
X.head(1)
Out[8]:
In [9]:
# only keep numeric columns in the feature matrix.
# FIX: the original used the private pandas API `X._get_numeric_data()`, which is
# not part of the public interface and may break between pandas versions;
# `select_dtypes(include='number')` is the supported equivalent for this dataset.
X = X.select_dtypes(include='number')
# peek at the first row to confirm the column filtering
X.head(1)
Out[9]:
In [11]:
# build the response vector y (a Series) from the target column
y = X['Survived']
# show the first few labels as a sanity check
y.head(3)
Out[11]:
In [21]:
# remove the target ('Survived') from the feature matrix, and drop 'Age'
# because it contains NaN values in some rows — both in a single in-place call
X.drop(['Survived', 'Age'], axis=1, inplace=True)
In [22]:
# check delete: confirm 'Survived' and 'Age' no longer appear among the columns
X.head()
Out[22]:
In [23]:
# imports for classifiers and metrics
from sklearn.tree import DecisionTreeClassifier
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import f1_score
In [24]:
# train/test split with a fixed seed for reproducibility.
# FIX: `sklearn.cross_validation` was deprecated in scikit-learn 0.18 and removed
# in 0.20; the supported module is `sklearn.model_selection`.
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=0)
In [25]:
# Decision Tree Classifier: fit on the training split, score F1 on the test split.
# instantiate
dtc = DecisionTreeClassifier()
# fit
dtc.fit(X_train, y_train)
# predict
y_pred = dtc.predict(X_test)
# f1 score
# FIX: sklearn's signature is f1_score(y_true, y_pred) — the original passed the
# arguments swapped. Binary F1 happens to be symmetric in its two inputs, so the
# value is unchanged, but the conventional order avoids bugs with other metrics.
score = f1_score(y_test, y_pred)
# print — function-call form works under both Python 2 and 3 for a single argument
print("Decision Tree F1 score: {:.2f}".format(score))
In [27]:
# Gaussian Naive Bayes: fit on the training split, score F1 on the test split.
# instantiate
gnb = GaussianNB()
# fit
gnb.fit(X_train, y_train)
# predict
y_pred_2 = gnb.predict(X_test)
# f1 score
# FIX: sklearn's signature is f1_score(y_true, y_pred) — the original passed the
# arguments swapped (binary F1 is symmetric, so the value is unchanged).
score_2 = f1_score(y_test, y_pred_2)
# print — format spec normalized from '{: .2f}' to '{:.2f}' for consistency with
# the Decision Tree cell; function-call print works under both Python 2 and 3
print("GaussianNB F1 score: {:.2f}".format(score_2))