# Origin: git patch "Create classifier.py"
# (commit 0273476710d12b2e5e49c9f41f589f549b797b8c) by Günter Windsperger,
# Sat, 5 Jun 2021 15:18:06 +0200; adds competition/classifier.py.
"""Classify the records in ``input.csv`` with a previously trained model.

The script reads ``input.csv`` into a DataFrame, label-encodes the
``sourceIPAddress`` and ``destinationIPAddress`` columns, loads the pickled
model from ``network_traffic_classifier.sav``, predicts one label per row,
stores the labels in a new ``prediction`` column and prints the result.
"""

# 1. Importing new CSV data in pandas dataframes
import pickle

import pandas as pd
from sklearn import preprocessing

data = pd.read_csv("input.csv")

# 2. Preprocessing data - encode IP addresses to numerical values
# NOTE(review): the encoder is fitted on this input file only, so the integer
# assigned to an address depends on which addresses occur here. Confirm that
# this matches the encoding the model was trained with.
le = preprocessing.LabelEncoder()
data['sourceIPAddress'] = le.fit_transform(data['sourceIPAddress'])
data['destinationIPAddress'] = le.fit_transform(data['destinationIPAddress'])

# Build the feature matrix only AFTER encoding; taking it earlier would hand
# the raw address strings to the model and make the preprocessing pointless.
x = data.to_numpy()

# 3. Loading a trained model
# NOTE: unpickling can execute arbitrary code - only load model files that
# come from a trusted source.
with open('network_traffic_classifier.sav', 'rb') as model_file:
    model = pickle.load(model_file)
y_pred = model.predict(x)

# 4. Attaching the predictions to the data
# DataFrame.append() concatenates rows, returns a new frame, and was removed
# in pandas 2.0; assigning a column is what stores one prediction per row.
data['prediction'] = y_pred

print(data)