Finished Model Evaluation Metrics

2019-07-12 02:01:41 +01:00
parent b5dd5aa345
commit af3c2caa6a
14 changed files with 8668 additions and 0 deletions
--- a/python/Supervised
+++ b/python/Supervised
@@ -0,0 +1,35 @@
+# Import statements
+from sklearn.tree import DecisionTreeClassifier
+from sklearn.metrics import accuracy_score
+import pandas as pd
+import numpy as np
+from sklearn.model_selection import train_test_split
+
+# Import the train test split
+# http://scikit-learn.org/0.16/modules/generated/sklearn.cross_validation.train_test_split.html
+
+
+# Read in the data.
+data = np.asarray(pd.read_csv('data.csv', header=None))
+# Assign the features to the variable X, and the labels to the variable y.
+X = data[:, 0:2]
+y = data[:, 2]
+
+# Use train test split to split your data
+# Use a test size of 25% and a random state of 42
+X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.25,
+                                                    random_state=42)
+
+# Instantiate your decision tree model
+model = DecisionTreeClassifier()
+
+# TODO: Fit the model to the training data.
+model.fit(X_train, y_train)
+
+# TODO: Make predictions on the test data
+y_pred = model.predict(X_test)
+
+# TODO: Calculate the accuracy and assign it to the variable acc on the test
+# data.
+acc = accuracy_score(y_test, y_pred)
+print(acc)