-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_madelon.py
106 lines (87 loc) · 4 KB
/
run_madelon.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
import timeit
import numpy as np
import scipy.io as sio
import torch
from sklearn import preprocessing
from sklearn.datasets import load_svmlight_file
from sklearn.linear_model import LogisticRegression
from model_LR_NN_PR import LogisticRegressionNet
if __name__ == "__main__":
dataset_name = "madelon"
train_path = f'./datasets//{dataset_name}'
test_path = f'./datasets//{dataset_name}.t'
train_set_x, train_set_y = load_svmlight_file(train_path)
train_set_x = train_set_x.todense()
train_set_y[train_set_y==-1] = 0
torch.random.manual_seed(0)
# device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
device = 'cpu'
N = train_set_x.shape[0] # batch size
in_dim = train_set_x.shape[1] # input dimension
out_dim = 1 # output dimension
learning_rate = 1e-1
tolerance = 1e-7
max_itr = 500
# preprocessing
scaler = preprocessing.StandardScaler()
train_set_x = scaler.fit_transform(train_set_x)
# np -> tensor
x = torch.from_numpy(train_set_x).float().to(device)
y = torch.from_numpy(train_set_y).float().to(device).squeeze_()
# Construct our model by instantiating the class defined above.
model = LogisticRegressionNet(in_dim, out_dim, y,lam=1.0,device=device)
# optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate, momentum=0.0)
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate, betas=(0.5, 0.999))
loss_prev = float('inf')
start = timeit.default_timer()
for t in range(max_itr+1):
loss = model(x)
# if (t % 5 == 0):
# print(t, loss.item())
if(abs(loss - loss_prev) <= tolerance):
break
# Zero gradients, perform a backward pass, and update the weights.
loss_prev = loss
optimizer.zero_grad()
loss.backward()
optimizer.step()
stop = timeit.default_timer()
time_our_method = stop - start
print('Number of itr : ', t)
# testing
test_set_x, test_set_y = load_svmlight_file(test_path)
test_set_x = test_set_x.todense()
scaler = preprocessing.StandardScaler()
test_set_x = scaler.fit_transform(test_set_x)
test_set_y[test_set_y==-1] = 0
x_test = torch.from_numpy(test_set_x).float().to(device)
y_test = torch.from_numpy(test_set_y).float().to(device).squeeze_()
y_predict = model.predict(x_test)
acc = 100 - torch.mean(abs(y_predict - y_test))*100
print('Time (our method): ', time_our_method)
print ("accurency (our method): ", acc.item())
#SKLearn Logistic Regression
#https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html
logreg_l1 = LogisticRegression(C=1.0, penalty='l1', tol=tolerance, max_iter=max_itr, solver='liblinear')
start = timeit.default_timer()
logreg_l1.fit(train_set_x, train_set_y.squeeze())
stop = timeit.default_timer()
time_lr_sklearn = stop - start
print('Time (sklearn LR-L1): ', time_lr_sklearn)
y_pred = logreg_l1.predict(test_set_x)
print ("accurency (sklearn LR-L1): ", 100 - np.mean(abs(y_pred - test_set_y))*100)
#SKLearn Logistic Regression
#https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html
logreg_l2 = LogisticRegression(C=1.0, penalty='l2', tol=tolerance, max_iter=max_itr, solver='liblinear')
start = timeit.default_timer()
logreg_l2.fit(train_set_x, train_set_y.squeeze())
stop = timeit.default_timer()
time_lr_sklearn = stop - start
print('Time (sklearn LR-L2): ', time_lr_sklearn)
y_pred = logreg_l2.predict(test_set_x)
print ("accurency (sklearn LR-L2): ", 100 - np.mean(abs(y_pred - test_set_y))*100)
# save results for draw ROC
y_prob_l1 = logreg_l1.predict_proba(test_set_x)
y_prob_l2 = logreg_l2.predict_proba(test_set_x)
y_score = model.predict_proba(x_test).detach().numpy()
sio.savemat(f"./results/{dataset_name}_ours.mat", {'score_our': y_score, 'score_sk_l1':y_prob_l1[:, 1], 'score_sk_l2':y_prob_l2[:, 1]})