-
Notifications
You must be signed in to change notification settings - Fork 5
Expand file tree
/
Copy pathvisualize_unsw_hist.py
More file actions
47 lines (42 loc) · 1.83 KB
/
visualize_unsw_hist.py
File metadata and controls
47 lines (42 loc) · 1.83 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
from __future__ import print_function
import numpy as np
from netlearner.utils import create_dir
from netlearner.utils import quantile_transform, log_transform
from preprocess.unsw import generate_dataset
from visualize.feature_plots import plot_feature_histogram
from visualize.feature_plots import plot_feature_with_labels
generate_dataset(one_hot_encode=False)
raw_train_dataset = np.load('UNSW/train_dataset.npy')
train_labels = np.load('UNSW/train_labels.npy')
raw_valid_dataset = np.load('UNSW/valid_dataset.npy')
valid_labels = np.load('UNSW/valid_labels.npy')
raw_test_dataset = np.load('UNSW/test_dataset.npy')
test_labels = np.load('UNSW/test_labels.npy')
# plot_single_feature_histogram(train_dataset, 'sjit')
print('Plot original dataset')
path = 'UNSW/Histogram/Original'
create_dir(path)
plot_feature_histogram(raw_train_dataset, path)
path = 'UNSW/FeatureComp/Original'
create_dir(path)
plot_feature_with_labels(raw_train_dataset, train_labels, path)
columns = np.array(range(1, 6) + range(8, 16) + range(17, 19) +
range(23, 25) + [26])
print('Plot quantile transformed dataset')
[train_dataset, valid_dataset, test_dataset] = quantile_transform(
raw_train_dataset, raw_valid_dataset, raw_test_dataset, columns)
path = 'UNSW/Histogram/QuantileTransformed'
create_dir(path)
plot_feature_histogram(train_dataset, path)
path = 'UNSW/FeatureComp/QuantileTransformed'
create_dir(path)
plot_feature_with_labels(train_dataset, train_labels, path)
print('Plot for log1p transformed dataset')
[train_dataset, valid_dataset, test_dataset] = log_transform(
raw_train_dataset, raw_valid_dataset, raw_test_dataset, columns)
path = 'UNSW/Histogram/LogTransformed'
create_dir(path)
plot_feature_histogram(train_dataset, path)
path = 'UNSW/FeatureComp/LogTransformed'
create_dir(path)
plot_feature_with_labels(train_dataset, train_labels, path)