ActuallyOpenAI
/
goingBALD


  
1

	
2

	
3

	
4

	
5

	
6

	
7

	
8

	
9

	
10

	
11

	
12

	
13

	
14

	
15

	
16

	
17

	
18

	
19

	
20

	
21

	
22

	
23

	
24

	
25

	
26

	
27

	
28

	
29

	
30

	
31

	
32

	
33

	
34

	
35

	
36

	
37

	
38

	
39

	
40

	
41

	
42

	
43

	
44

	
45

	
46

	
47

	
48

	
49

	
50

	
51

	
52

	
53

	
54

	
55

	
56

	
57

	
58

	
59

	
60

	
61

	
62

	
63

	
64

	
65

	
66

	
67

	
68

	
69

	
70

	
71

	
72

	
73

	
74

	
75

	
76

	
77

	
78

	
79

	
80

	
81

	
82

	
83

	
84

	
85

	
86

	
87

	
88

	
89

	
90

	
91

	
92

	
93

	
94

	
95

	
96

	
97

	
98

	
99

	
100

	
101

	
102

	
            """
Step 1: train a simple model.
Step 2: train a simple model using active learning.
Step 3: understand something.
Step 4: feel productive.
Step 5: ...
Step 6: profit.
"""
import os
import matplotlib.pyplot as plt
from torchnlp.word_to_vector import GloVe
import torch
import torch.nn.functional as F
import tqdm
from torch import nn
from torch.utils.data import DataLoader
from sklearn.metrics import f1_score

from bald import data_dir,vectors_dir,load_ner_dataset
from bald.dataset import ConllDataset
from bald.simple_model import ConllModel
from bald.utils import epoch_run

# GloVe word vectors from torchnlp, cached in the project's vectors directory.
vectors = GloVe(cache=vectors_dir)

# Both CoNLL-2003 files are read from the same raw-data folder.
conll_dir = os.path.join(data_dir, "raw", "CoNLL2003")
train_path = os.path.join(conll_dir, "eng.train")
test_path = os.path.join(conll_dir, "eng.testa")

train_ds = ConllDataset(data_path=train_path, vectors=vectors, emb_dim=300)
test_ds = ConllDataset(data_path=test_path, vectors=vectors, emb_dim=300)

# Give both splits the same maximum sequence length: the larger of the two.
max_seq_len = max(train_ds.max_seq_len, test_ds.max_seq_len)
for ds in (train_ds, test_ds):
    ds.set_max_seq_len(max_seq_len)

# Only the training batches are shuffled; evaluation order stays fixed.
train_dl = DataLoader(train_ds, batch_size=32, shuffle=True)
test_dl = DataLoader(test_ds, batch_size=32, shuffle=False)

# Model dimensions are taken from the training dataset.
model = ConllModel(
    max_seq_len=max_seq_len,
    num_labels=train_ds.num_labels,
    emb_dim=train_ds.emb_dim,
)

def loss_fun(input, target):
    """Return the cross-entropy loss for a 2-D grid of label ids.

    The parameter names (including ``input``, which shadows the builtin) are
    kept as-is because callers may pass them by keyword.

    Args:
        input: Per-class scores handed straight to ``F.cross_entropy``; it
            must provide one row per element of ``target``.
        target: 2-D tensor of integer label ids, unpacked as
            ``(batch_len, seq_len)``. It may be non-contiguous.

    Returns:
        The loss tensor produced by ``F.cross_entropy``. Positions whose
        label id is 0 are excluded through ``ignore_index=0``.

    Raises:
        ValueError: If ``target`` is not 2-D (the size unpacking fails).
    """
    batch_len, seq_len = target.size()
    # reshape() instead of view(): view() raises on non-contiguous tensors
    # (e.g. a transposed or sliced batch), reshape() copies when it has to
    # and is identical to view() for contiguous input.
    flat_target = target.reshape(batch_len * seq_len)
    return F.cross_entropy(input=input, target=flat_target, ignore_index=0)

def score_fun(input, target):
    """Return the weighted F1 score of the arg-max predictions.

    The parameter names (including ``input``, which shadows the builtin) are
    kept as-is because callers may pass them by keyword.

    Args:
        input: 2-D tensor of per-class scores, unpacked as
            ``(rows, classes)``; the predicted label of a row is the index
            of its largest score.
        target: Tensor of gold label ids holding exactly ``rows`` elements in
            total; it is flattened before scoring.

    Returns:
        The result of ``sklearn.metrics.f1_score`` with
        ``average="weighted"``, restricted to label ids 1 through 5.

    Raises:
        ValueError: If ``input`` is not 2-D (the size unpacking fails).
    """
    num_rows, _num_classes = input.size()
    # Softmax is monotonic within a row, so the arg-max of the raw scores is
    # the same class the arg-max of the probabilities would pick.
    y_pred = torch.argmax(input, dim=1)
    # reshape() also accepts non-contiguous targets, unlike view().
    y_true = target.reshape(num_rows)
    return f1_score(
        y_true=y_true.detach().cpu().numpy(),
        y_pred=y_pred.detach().cpu().numpy(),
        # Label id 0 is left out of the score, matching ignore_index=0 in
        # loss_fun (presumably the padding label -- confirm in ConllDataset).
        labels=list(range(1, 6)),
        average="weighted",
    )

# Adam with its default hyper-parameters.
# Alternative: torch.optim.SGD(model.parameters(), lr=0.1, momentum=0.9)
optimizer = torch.optim.Adam(model.parameters())

# Number of epochs is fixed here; edit this value to train longer or shorter.
num_epochs = 30

# One loss value per epoch for each split, plotted after the loop.
train_losses = []
test_losses = []

for epoch in range(num_epochs):
    print(f"\nEpoch {epoch+1}.")

    print("Training.")
    run_d = epoch_run(
        model=model,
        data_loader=train_dl,
        criterion=loss_fun,
        score_fun=score_fun,
        trainer_mode=True,
        optimizer=optimizer,
    )

    train_losses.append(run_d["loss"])
    print(f"Train f1 score is {run_d['score']}.")

    print("Evaluating.")
    # Evaluate on the held-out loader. Using train_dl here would make the
    # "test" curve and score a second measurement of the training data.
    run_d = epoch_run(
        model=model,
        data_loader=test_dl,
        criterion=loss_fun,
        score_fun=score_fun,
        trainer_mode=False,
    )
    test_losses.append(run_d["loss"])
    print(f"Test f1 score is {run_d['score']}.")

# Compare the per-epoch training and test losses.
plt.plot(train_losses, label="train")
plt.plot(test_losses, label="test")
plt.legend()
plt.show()