python 3 fixes, initial commit

tobybreckon · tobybreckon · commit 0b037e69da64 · 2016-10-30T21:16:54.000Z
diff --git a/tools/randomize.py b/tools/randomize.py
@@ -0,0 +1,43 @@
+#####################################################################
+
+# Example : randomize loaded CSV file and write out to file
+# basic illustrative python script
+
+# Author : Toby Breckon, toby.breckon@durham.ac.uk
+
+# Copyright (c) 2014 / 2016 School of Engineering & Computing Science,
+#                    Durham University, UK
+# License : LGPL - http://www.gnu.org/licenses/lgpl.html
+
+#####################################################################
+
+import csv
+import cv2
+import numpy as np
+
+from random import shuffle
+
+########### Load Data Set - Example
+
+# load full data set (unsplit)
+
+reader=csv.reader(open("input.data","rt", encoding='ascii'),delimiter=',')
+
+
+entry_list = []
+
+for row in reader:
+        entry_list.append(row)
+
+########### randomize (different order for every file loaded)
+# N.B. to randomize attributes / labels together - append into single np array
+# with one {attribute/label} pair together, then shuffle
+
+shuffle(entry_list)
+
+########### Write Data Set - Example
+
+writer = csv.writer(open("output.data", "wt", encoding='ascii'), delimiter=',')
+writer.writerows(entry_list)
+
+#####################################################################
diff --git a/tools/reader.py b/tools/reader.py
@@ -0,0 +1,78 @@
+#####################################################################
+
+# Example : load HAPT data set only
+# basic illustrative python script
+
+# For use with test / training datasets : HAPT-data-set-DU
+
+# Author : Toby Breckon, toby.breckon@durham.ac.uk
+
+# Copyright (c) 2014 School of Engineering & Computing Science,
+#                    Durham University, UK
+# License : LGPL - http://www.gnu.org/licenses/lgpl.html
+
+#####################################################################
+
+import csv
+import cv2
+import os
+import numpy as np
+
+########### Define classes
+
+classes = {} # define mapping of classes
+inv_classes = {v: k for k, v in classes.items()}
+
+########### Load Data Set
+
+path_to_data = "../../assignment/2016-17/HAPT-data-set-DU" # edit this
+
+# Training data - as currently split
+
+attribute_list = []
+label_list = []
+
+reader=csv.reader(open(os.path.join(path_to_data, "Train/x_train.txt"),"rt", encoding='ascii'),delimiter=' ')
+for row in reader:
+        # attributes in columns 0-560 (561 values per row)
+        attribute_list.append(list(row[i] for i in (range(0,561))))
+
+reader=csv.reader(open(os.path.join(path_to_data, "Train/y_train.txt"),"rt", encoding='ascii'),delimiter=' ')
+for row in reader:
+        # label in column 0 (the first column)
+        label_list.append(row[0])
+
+training_attributes=np.array(attribute_list).astype(np.float32)
+training_labels=np.array(label_list).astype(np.float32)
+
+# Testing data - as currently split
+
+attribute_list = []
+label_list = []
+
+reader=csv.reader(open(os.path.join(path_to_data, "Test/x_test.txt"),"rt", encoding='ascii'),delimiter=' ')
+for row in reader:
+        # attributes in columns 0-560 (561 values per row)
+        attribute_list.append(list(row[i] for i in (range(0,561))))
+
+reader=csv.reader(open(os.path.join(path_to_data, "Test/y_test.txt"),"rt", encoding='ascii'),delimiter=' ')
+for row in reader:
+        # label in column 0 (the first column)
+        label_list.append(row[0])
+
+testing_attributes=np.array(attribute_list).astype(np.float32)
+testing_labels=np.array(label_list).astype(np.float32)
+
+###########  test output for sanity
+
+print(training_attributes)
+print(len(training_attributes))
+print(training_labels)
+print(len(training_labels))
+
+print(testing_attributes)
+print(len(testing_attributes))
+print(testing_labels)
+print(len(testing_labels))
+
+#####################################################################
diff --git a/tools/selectlines.py b/tools/selectlines.py
@@ -0,0 +1,46 @@
+#####################################################################
+
+# Example : select subset of lines from CSV file and write to files
+# basic illustrative python script
+
+# Author : Toby Breckon, toby.breckon@durham.ac.uk
+
+# Copyright (c) 2014 / 2016 School of Engineering & Computing Science,
+#                    Durham University, UK
+# License : LGPL - http://www.gnu.org/licenses/lgpl.html
+
+#####################################################################
+
+import csv
+import cv2
+import numpy as np
+import math
+
+from random import shuffle
+
+########### Load Data Set - Example
+
+# load full data set (unsplit)
+
+reader=csv.reader(open("input.data","rt", encoding='ascii'),delimiter=',')
+
+entry_list = []
+
+for row in reader:
+        entry_list.append(row)
+
+########### Write Data Set - Example
+
+# write first N% of the entries to first file
+
+N = 30.0
+
+writerA = csv.writer(open("outputA.data", "wt", encoding='ascii'), delimiter=',')
+writerA.writerows(entry_list[0:int(math.floor(len(entry_list)* (N/100.0)))])
+
+# write the remaining (100-N)% of the entries to the second file
+
+writerB = csv.writer(open("outputB.data", "wt", encoding='ascii'), delimiter=',')
+writerB.writerows(entry_list[int(math.floor(len(entry_list)* (N/100.0))):len(entry_list)])
+
+#####################################################################