diff --git a/tools/karoo_multiclassifier.py b/tools/karoo_multiclassifier.py index cd1d34d..92502a4 100644 --- a/tools/karoo_multiclassifier.py +++ b/tools/karoo_multiclassifier.py @@ -4,7 +4,8 @@ ''' This is a toy script, designed to allow you to play with multiclass classification using the same underlying function -as employed by Karoo GP. +as employed by Karoo GP. Keep in mind that a linear multiclass classifier such as this is suited only for data which +itself has a linear (e.g. time series) component, else GP will struggle to force the data to fit. ''' from numpy import arange diff --git a/tools/karoo_normalise.py b/tools/karoo_normalise.py index 856386b..f21c11f 100644 --- a/tools/karoo_normalise.py +++ b/tools/karoo_normalise.py @@ -8,9 +8,9 @@ import numpy as np np.set_printoptions(linewidth = 320) # set the terminal to print 320 characters before line-wrapping in order to view Trees ''' -This script works with a raw dataset to prepare a new, normalised dataset. It does so by comparing all values in each -given column, finding the maximum and minimum values, and then modifying each value to fall between a high of 1 and -low of 0. The modified values are written to a new file, the original remaining untouched. +This script works with a dataset to prepare a new, normalised dataset. It does so by comparing all values in each given +column, finding the maximum and minimum values, and then modifying each value to fall between a high of 1 and low of 0. +The modified values are written to a new file, the original remaining untouched. This script can be used *after* karoo_features_sort.py, and assumes no header has yet been applied to the .csv. '''