# script_init_params.py -- from the L1LR repository (Majeed7/L1LR, branch main).
import torch

import numpy as np
from sklearn import preprocessing
from sklearn.datasets import load_svmlight_file
import matplotlib.pyplot as plt
from scipy.signal import savgol_filter

from model_LR_NN_PR import LogisticRegressionNet

if __name__ == "__main__":
    # Experiment: for every tracked weight index j, build a fresh model, shift
    # only weight j by an initial offset, run max_itr Adam steps on the full
    # data set, and record that weight after every step. Three offset schemes
    # are compared (0, 1, and a standard-normal draw) and plotted side by side.

    train_path = './datasets//splice'
    train_set_x, train_set_y = load_svmlight_file(train_path)
    # toarray() returns a plain ndarray. todense() returns np.matrix, which
    # recent scikit-learn releases reject in StandardScaler.fit_transform.
    train_set_x = train_set_x.toarray()
    train_set_y[train_set_y == -1] = 0  # relabel -1 targets as 0

    # Seed NumPy as well as torch: the random offsets below are drawn from
    # np.random, which was previously unseeded, so runs were not repeatable.
    torch.random.manual_seed(0)
    np.random.seed(0)
    device = 'cpu'

    in_dim = train_set_x.shape[1]  # input dimension
    out_dim = 1  # output dimension
    learning_rate = 7e-2
    max_itr = 150
    lam = 10
    n_schemes = 3  # scheme 0 -> offset 0, scheme 1 -> offset 1, scheme 2 -> random
    n_tracked = in_dim - 25  # only weights 0 .. in_dim-26 are perturbed and tracked

    # preprocessing
    scaler = preprocessing.StandardScaler()
    train_set_x = scaler.fit_transform(train_set_x)

    # np -> tensor
    x = torch.from_numpy(train_set_x).float().to(device)
    y = torch.from_numpy(train_set_y).float().to(device)

    # weights_changes[i, j, t]: value of weight j after t optimizer steps under
    # scheme i (t == 0 is the value right after the offset is applied).
    weights_changes = np.zeros((n_schemes, n_tracked, max_itr + 1))

    for i in range(n_schemes):
        for j in range(n_tracked):
            # A fresh model per (scheme, weight) pair so runs do not interact.
            model = LogisticRegressionNet(in_dim, out_dim, y, lam=lam, device=device)
            init_val = np.random.randn() if i == 2 else i
            # Shift only weight j; no_grad keeps the edit out of the autograd graph.
            with torch.no_grad():
                model.weight[j].add_(init_val)
            weights_changes[i, j, 0] = model.weight[j].item()

            optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate, betas=(0.5, 0.999))
            for t in range(1, max_itr + 1):
                # The model's forward pass returns the training loss directly.
                loss = model(x)
                # Zero gradients, perform a backward pass, and update the weights.
                optimizer.zero_grad()
                loss.backward()
                optimizer.step()
                weights_changes[i, j, t] = model.weight[j].item()

    plt.rcParams["font.family"] = "Arial"

    fig, ax = plt.subplots(1, n_schemes, sharex=True, sharey=True, figsize=(18, 6), dpi=300)
    for i in range(n_schemes):
        for j in range(n_tracked):
            # Smooth each trajectory (window 25, quadratic fit) before plotting.
            w_smooth = savgol_filter(weights_changes[i, j], 25, 2)
            ax[i].plot(w_smooth, label=f'W{j}', linestyle='-')

        ax[i].set_title('Weights initial value = ' + ('Random' if i == 2 else str(i)), fontsize=16)
        ax[i].set_xlabel('Iteration', fontsize=18)
        ax[i].set_ylabel('Values of the Weights', fontsize=18)

    # Save before show(): the figure may be gone once the window is closed.
    plt.savefig('./chart_different_w_init.png', format='png', bbox_inches='tight')
    plt.savefig('./chart_different_w_init.eps', format='eps', bbox_inches='tight')
    plt.show()