-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathangle_encoding.py
More file actions
69 lines (54 loc) · 2.87 KB
/
Copy pathangle_encoding.py
File metadata and controls
69 lines (54 loc) · 2.87 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
import sys
import numpy as np
import pandas as pd
from sklearn.decomposition import PCA
from sklearn.preprocessing import StandardScaler
PCA_num_features = int(sys.argv[1])
data_set_train = pd.read_csv(f"Usable_data_sets/trainning_data_set.csv")
data_set_test = pd.read_csv(f"Usable_data_sets/test_data_set.csv")
data_set_train.rename(columns={list(data_set_train)[0]:"OldIndex"}, inplace=True)
data_set_test.rename(columns={list(data_set_test)[0]:"OldIndex"}, inplace=True)
FEATURES_NAMES = list(data_set_train)[2:]
COUNTER = 0
NUM_FEATURES = 12
NUM_SAMPLES_train = len(data_set_train)
NUM_SAMPLES_test = len(data_set_test)
def normalize_ang(array):
r = array.copy()
for i, elem in enumerate(array):
maxi = max([abs(x) for x in elem])
for j, num in enumerate(elem):
r[i][j] = num * np.pi / maxi
return r
def normalize(array):
r = array.copy()
for i, datapoint in enumerate(array):
soma_sq = sum([x for x in datapoint])
r[i] /= soma_sq
return r
def main():
train_data_set_features = data_set_train.loc[:, FEATURES_NAMES]
train_classes = data_set_train.loc[:, ["CLASSE"]].values
test_data_set_features = data_set_test.loc[:, FEATURES_NAMES]
test_classes = data_set_test.loc[:, ["CLASSE"]].values
if PCA_num_features != 12:
scaler = StandardScaler()
x_train_data = scaler.fit_transform(train_data_set_features)# Apply transform to both the training set and the test set.
x_test_data = scaler.transform(test_data_set_features)
pca = PCA(n_components=PCA_num_features)
train_data_set_features = pca.fit_transform(x_train_data)
test_data_set_features = pca.fit_transform(x_test_data)
train_classes_encode = [-1 if classe == "W" else 1 for classe in train_classes]
test_classes_encode = [-1 if classe == "W" else 1 for classe in test_classes]
train_np_data_set_features_std = normalize_ang(train_data_set_features)
test_np_data_set_features_std = normalize_ang(test_data_set_features)
np.savetxt(f"Encode_data/ang_enc_data_set_trainning_values.csv", train_np_data_set_features_std, delimiter=";")
np.savetxt(f"Encode_data/ang_enc_data_set_trainning_classes.csv", train_classes_encode, delimiter=";")
np.savetxt(f"Encode_data/ang_enc_data_set_test_values.csv", test_np_data_set_features_std, delimiter=";")
np.savetxt(f"Encode_data/ang_enc_data_set_test_classes.csv", test_classes_encode, delimiter=";")
print(f"Amplitude Enconding guardado em \"Encode_data/ang_enc_data_set_trainning_values.csv\"")
print(f"Amplitude Enconding guardado em \"Encode_data/ang_enc_data_set_trainning_classes.csv\"")
print(f"Amplitude Enconding guardado em \"Encode_data/ang_enc_data_set_test_values.csv\"")
print(f"Amplitude Enconding guardado em \"Encode_data/ang_enc_data_set_test_classes.csv\"")
if __name__ == '__main__':
main()