├── exp └── test │ ├── run.err │ ├── run.sh │ ├── run_noatt.out │ └── run.out ├── models.py ├── _scratch ├── notes2.txt ├── notes.txt └── metacomp.py ├── vocab.py ├── hlog.py ├── .gitignore ├── grammar.py ├── seq.py ├── metacomp.py └── cp.py /exp/test/run.err: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /models.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import torch 3 | from torch import nn, optim 4 | import torch.utils.data as torch_data 5 | -------------------------------------------------------------------------------- /_scratch/notes2.txt: -------------------------------------------------------------------------------- 1 | learn to: 2 | retrieve mini training examples 3 | generate translations "nonparametrically" 4 | by interacting with K--V store 5 | -------------------------------------------------------------------------------- /exp/test/run.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | #export PYTHONPATH='../..:../../lib/fairseq' 4 | 5 | python -u ../../metacomp.py \ 6 | > run_noatt.out \ 7 | 2> run.err 8 | -------------------------------------------------------------------------------- /_scratch/notes.txt: -------------------------------------------------------------------------------- 1 | multitask training 2 | joint 3 | pre-train then fine-tune 4 | 5 | posterior regularization 6 | input length correlated with output length 7 | input reconstructable from output 8 | minimize collisions 9 | 10 | primitive: imagine recombining slices of input sequences 11 | on training sequences: likelihood 12 | on synthesized sequences: reconstruct input from output 13 | 14 | model structure 15 | start with a phrase table / learn glue with copying 16 | -------------------------------------------------------------------------------- /vocab.py: -------------------------------------------------------------------------------- 1 | class Vocab(object): 2 | PAD = '' 3 | SOS = '' 4 | EOS = '' 5 | 6 | def __init__(self): 7 | self._contents = {} 8 | self._rev_contents = {} 9 | self.add(self.PAD) 10 | self.add(self.SOS) 11 | self.add(self.EOS) 12 | 13 | def add(self, sym): 14 | if sym not in self._contents: 15 | i = len(self._contents) 16 | self._contents[sym] = i 17 | self._rev_contents[i] = sym 18 | return self._contents[sym] 19 | 20 | def __getitem__(self, sym): 21 | return self._contents[sym] 22 | 23 | def __len__(self): 24 | return len(self._contents) 25 | 26 | def encode(self, seq): 27 | return [self.sos()] + [self[i] for i in seq] + [self.eos()] 28 | 29 | def decode(self, seq): 30 | return ''.join(self._rev_contents[i] for i in seq) 31 | 32 | def pad(self): 33 | return self._contents[self.PAD] 34 | 35 | def sos(self): 36 | return self._contents[self.SOS] 37 | 38 | def eos(self): 39 | return self._contents[self.EOS] 40 | -------------------------------------------------------------------------------- /hlog.py: -------------------------------------------------------------------------------- 1 | from contextlib import contextmanager 2 | import logging 3 | import threading 4 | import time 5 | 6 | state = threading.local() 7 | state.path = [] 8 | 9 | @contextmanager 10 | def task(name, timer=True): 11 | state.path.append(name) 12 | begin = time.time() 13 | yield 14 | end = time.time() 15 | if timer: 16 | print('%s{%0.2fs}' % ('/'.join(state.path), end - begin)) 17 | state.path.pop() 18 | 19 | def group(name): 20 | return task(name, timer=False) 21 | 22 | def log(value): 23 | if isinstance(value, float): 24 | value = "%0.4f" % value 25 | print('%s %s' % ('/'.join(state.path), value)) 26 | 27 | def value(name, value): 28 | with task(name, timer=False): 29 | log(value) 30 | 31 | def loop(template, coll=None, counter=None, timer=True): 32 | assert not (coll is None and counter is None) 33 | if coll is None: 34 | seq = zip(counter, counter) 35 | elif counter is None: 36 | seq = enumerate(coll) 37 | else: 38 | assert len(counter) == len(coll) 39 | seq = zip(counter, coll) 40 | for i, item in seq: 41 | with task(template % i, timer): 42 | yield item 43 | 44 | def fn(name, timer=True): 45 | def wrap(underlying): 46 | def wrapped(*args, **kwargs): 47 | with task(name, timer): 48 | result = underlying(*args, **kwargs) 49 | return result 50 | return wrapped 51 | return wrap 52 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | *.egg-info/ 24 | .installed.cfg 25 | *.egg 26 | MANIFEST 27 | 28 | # PyInstaller 29 | # Usually these files are written by a python script from a template 30 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 31 | *.manifest 32 | *.spec 33 | 34 | # Installer logs 35 | pip-log.txt 36 | pip-delete-this-directory.txt 37 | 38 | # Unit test / coverage reports 39 | htmlcov/ 40 | .tox/ 41 | .coverage 42 | .coverage.* 43 | .cache 44 | nosetests.xml 45 | coverage.xml 46 | *.cover 47 | .hypothesis/ 48 | .pytest_cache/ 49 | 50 | # Translations 51 | *.mo 52 | *.pot 53 | 54 | # Django stuff: 55 | *.log 56 | local_settings.py 57 | db.sqlite3 58 | 59 | # Flask stuff: 60 | instance/ 61 | .webassets-cache 62 | 63 | # Scrapy stuff: 64 | .scrapy 65 | 66 | # Sphinx documentation 67 | docs/_build/ 68 | 69 | # PyBuilder 70 | target/ 71 | 72 | # Jupyter Notebook 73 | .ipynb_checkpoints 74 | 75 | # pyenv 76 | .python-version 77 | 78 | # celery beat schedule file 79 | celerybeat-schedule 80 | 81 | # SageMath parsed files 82 | *.sage.py 83 | 84 | # Environments 85 | .env 86 | .venv 87 | env/ 88 | venv/ 89 | ENV/ 90 | env.bak/ 91 | venv.bak/ 92 | 93 | # Spyder project settings 94 | .spyderproject 95 | .spyproject 96 | 97 | # Rope project settings 98 | .ropeproject 99 | 100 | # mkdocs documentation 101 | /site 102 | 103 | # mypy 104 | .mypy_cache/ 105 | 106 | *.swp 107 | -------------------------------------------------------------------------------- /grammar.py: -------------------------------------------------------------------------------- 1 | from collections import namedtuple 2 | import numpy as np 3 | 4 | NTRule = namedtuple('NTRule', ['lhs', 'rhs', 'i_e', 'i_f']) 5 | TRule = namedtuple('TRule', ['lhs', 'rhs_e', 'rhs_f']) 6 | class Grammar(object): 7 | def __init__(self, root, rules): 8 | self.root = root 9 | self.rules = rules 10 | 11 | def sample(self, lhs=None): 12 | if lhs is None: 13 | lhs = self.root 14 | rules = self.rules[lhs] 15 | rule = rules[np.random.randint(len(rules))] 16 | if isinstance(rule, TRule): 17 | return (rule.rhs_e,), (rule.rhs_f,) 18 | elif isinstance(rule, NTRule): 19 | produced = [self.sample(s) for s in rule.rhs] 20 | e = sum([produced[i][0] for i in rule.i_e], ()) 21 | f = sum([produced[i][1] for i in rule.i_f], ()) 22 | return e, f 23 | 24 | def prune(self): 25 | visited = {nt: False for nt in self.rules.keys()} 26 | generates = { 27 | nt: any(isinstance(r, TRule) for r in rr) 28 | for nt, rr in self.rules.items() 29 | } 30 | keep_rules = {} 31 | def check(nt): 32 | if visited[nt]: 33 | return generates[nt] 34 | visited[nt] = True 35 | usable = [ 36 | r for r in self.rules[nt] 37 | if isinstance(r, TRule) or all(check(n) for n in r.rhs) 38 | ] 39 | generates[nt] = generates[nt] or len(usable) > 0 40 | keep_rules[nt] = usable 41 | return generates[nt] 42 | 43 | check(self.root) 44 | keep_rules = { 45 | nt: rr 46 | for nt, rr in keep_rules.items() 47 | if visited[nt] and generates[nt] 48 | } 49 | return Grammar(self.root, keep_rules) 50 | 51 | class GrammarBuilder(object): 52 | def symbols(self, n_t): 53 | return [chr(ord('a') + i) for i in range(n_t)] 54 | 55 | def _try_sample(self, n_nt, n_t, n_nt_rules, n_t_rules): 56 | assert n_nt > 1 57 | assert n_t > 1 58 | nt_names = [chr(ord('A') + i) for i in range(n_nt)] 59 | t_e_names = [chr(ord('a') + i) for i in range(n_t)] 60 | t_f_names = [chr(ord('a') + i) for i in range(n_t)] 61 | np.random.shuffle(t_f_names) 62 | #t_e_names = list(range(n_t)) 63 | #t_f_names = list(range(n_t)) 64 | 65 | i_e = (0, 1) 66 | i_f = (0, 1) if np.random.randint(2) == 0 else (1, 0) 67 | 68 | nt_rules = [] 69 | for _ in range(n_nt_rules): 70 | lhs = np.random.randint(n_nt - 1) 71 | rhs1 = lhs + 1 + np.random.randint(n_nt - lhs - 1) 72 | rhs2 = lhs + 1 + np.random.randint(n_nt - lhs - 1) 73 | nt_rules.append(NTRule( 74 | nt_names[lhs], 75 | (nt_names[rhs1], nt_names[rhs2]), 76 | i_e, 77 | i_f 78 | )) 79 | 80 | t_rules = [] 81 | for _ in range(n_t_rules): 82 | lhs = np.random.randint(n_nt) 83 | rhs = np.random.randint(n_t) 84 | t_rules.append(TRule( 85 | nt_names[lhs], 86 | t_e_names[rhs], 87 | t_f_names[rhs] 88 | )) 89 | 90 | rules = {nt: [] for nt in nt_names} 91 | for rule in nt_rules: 92 | rules[rule.lhs].append(rule) 93 | for rule in t_rules: 94 | rules[rule.lhs].append(rule) 95 | 96 | grammar = Grammar(nt_names[0], rules) 97 | grammar = grammar.prune() 98 | if len(grammar.rules) == 0 or grammar.root not in grammar.rules: 99 | raise RuntimeError('sampled a bad grammar') 100 | return grammar 101 | 102 | def sample(self, n_nt, n_t, n_nt_rules, n_t_rules): 103 | counter = 0 104 | while counter < 100: 105 | try: 106 | return self._try_sample(n_nt, n_t, n_nt_rules, n_t_rules) 107 | except RuntimeError as e: 108 | counter += 1 109 | raise RuntimeError( 110 | "Couldn't generate a good grammar in 100 attempts - try adjusting " 111 | "sampler parameters" 112 | ) 113 | -------------------------------------------------------------------------------- /seq.py: -------------------------------------------------------------------------------- 1 | import torch 2 | from torch import nn 3 | import torch.nn.functional as F 4 | 5 | class Encoder(nn.Module): 6 | def __init__(self, vocab, n_embed, n_hidden, n_layers, bidirectional=True): 7 | super().__init__() 8 | self.vocab = vocab 9 | self.embed = nn.Embedding(len(vocab), n_embed, vocab.pad()) 10 | self.rnn = nn.LSTM( 11 | n_embed, 12 | n_hidden, 13 | n_layers, 14 | bidirectional=bidirectional, 15 | batch_first=True 16 | ) 17 | 18 | def forward(self, data): 19 | emb = self.embed(data) 20 | out, state = self.rnn(emb) 21 | return out, state 22 | 23 | class Decoder(nn.Module): 24 | def __init__(self, vocab): 25 | super().__init__() 26 | self.vocab = vocab 27 | 28 | # TODO 29 | def decode(self, context, state, device): 30 | n_batch = state[0].shape[1] 31 | data = torch.tensor([[self.vocab.sos()] for _ in range(n_batch)]).to(device) 32 | out = [[] for _ in range(n_batch)] 33 | hiddens = [[] for _ in range(n_batch)] 34 | for t in range(20): 35 | pred, state = self(context, data, state) 36 | best = pred.squeeze(1).argmax(dim=1) 37 | for i in range(n_batch): 38 | out[i].append(int(best[i].data)) 39 | hiddens[i].append(state[0][:, i, :]) 40 | data = best.unsqueeze(1) 41 | final = [] 42 | final_hiddens = [] 43 | for o, h in zip(out, hiddens): 44 | try: 45 | end = o.index(self.vocab.eos()) 46 | final.append(o[:end]) 47 | final_hiddens.append(h[:end]) 48 | except ValueError: 49 | final.append(o) 50 | final_hiddens.append(h) 51 | return final, final_hiddens 52 | 53 | def forward(self, context, data, state): 54 | n_batch, n_seq = data.shape 55 | preds = [] 56 | for t in range(n_seq): 57 | pred, state = self.step(context, data[:, t], state) 58 | preds.append(pred) 59 | preds = torch.stack(preds, dim=1) 60 | return preds, state 61 | 62 | class SimpleDecoder(Decoder): 63 | def __init__(self, vocab, n_embed, n_hidden, n_layers): 64 | super().__init__(vocab) 65 | self.embed = nn.Embedding(len(vocab), n_embed, vocab.pad()) 66 | self.rnn = nn.LSTM( 67 | n_embed, 68 | n_hidden, 69 | n_layers, 70 | batch_first=True 71 | ) 72 | self.predict = nn.Linear(n_hidden, len(vocab)) 73 | 74 | def step(self, context, data, state): 75 | emb = self.embed(data) 76 | out, state = self.rnn(emb.unsqueeze(1), state) 77 | pred = self.predict(out).squeeze(1) 78 | return pred, state 79 | 80 | #def forward(self, data, state): 81 | # emb = self.embed(data) 82 | # out, state = self.rnn(emb, state) 83 | # pred = self.predict(out) 84 | # return pred, state 85 | 86 | class AttDecoder(Decoder): 87 | def __init__(self, vocab, n_embed, n_ctx, n_hidden, n_layers): 88 | super().__init__(vocab) 89 | # TODO the Luong way 90 | self.att_key = nn.Linear(n_ctx, n_hidden) 91 | self.att_val = nn.Linear(n_ctx, n_hidden) 92 | self.embed = nn.Embedding(len(vocab), n_embed, vocab.pad()) 93 | self.rnn = nn.LSTM( 94 | n_embed + n_hidden, 95 | n_hidden, 96 | n_layers, 97 | batch_first=True 98 | ) 99 | self.predict = nn.Linear(n_hidden, len(vocab)) 100 | 101 | def step(self, context, data, state): 102 | hid, _ = state 103 | key = self.att_key(context) 104 | hid = hid.squeeze(0).unsqueeze(1).expand_as(key) 105 | att = F.softmax((key * hid).sum(dim=2), 1) 106 | pooled = (context * att.unsqueeze(2).expand_as(context)).sum(dim=1) 107 | 108 | val = self.att_val(pooled) 109 | emb = self.embed(data) 110 | feats = torch.cat((emb, val), dim=1) 111 | 112 | out, state = self.rnn(feats.unsqueeze(1), state) 113 | pred = self.predict(out).squeeze(1) 114 | return pred, state 115 | -------------------------------------------------------------------------------- /_scratch/metacomp.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python3 2 | 3 | from collections import namedtuple 4 | import numpy as np 5 | import torch 6 | from torch import nn, optim 7 | from torch.autograd import Variable 8 | 9 | VOCAB_SIZE = 2 10 | START = 1 11 | STOP = 2 12 | FULL_VOCAB_SIZE = VOCAB_SIZE + 3 13 | #TRAIN_LENS = [i for i in range(20) if i % 2 == 0] 14 | #TEST_LENS = [i for i in range(20) if i % 2 == 1] 15 | TRAIN_LENS = [i for i in range(5)] 16 | TEST_LENS = [i for i in range(5, 10)] 17 | LENS = list(TRAIN_LENS) + list(TEST_LENS) 18 | MAX_LEN = max(LENS) + 1 + 2 19 | 20 | N_EMBED = 64 21 | N_HIDDEN = 256 22 | 23 | Batch = namedtuple('Batch', 'e_seq f_seq e_obs f_obs f_tgt') 24 | 25 | def unwrap(var): 26 | return var.data.cpu().numpy() 27 | 28 | def sample_copy(n, test=False): 29 | lens = TEST_LENS if test else TRAIN_LENS 30 | data = np.random.randint(VOCAB_SIZE, size=(n, MAX_LEN)) + 3 31 | seq = [[] for _ in range(n)] 32 | obs = np.zeros((MAX_LEN, n, FULL_VOCAB_SIZE)) 33 | tgt = np.zeros((MAX_LEN, n), dtype=np.int64) 34 | for i in range(n): 35 | seq[i].append(START) 36 | obs[0, i, START] = 1 37 | l = np.random.choice(lens) 38 | last = l + 2 39 | for j in range(1, last): 40 | seq[i].append(data[i, j]) 41 | obs[j, i, data[i, j]] = 1 42 | tgt[j-1, i] = data[i, j] 43 | obs[last, i, STOP] = 1 44 | tgt[last-1, i] = STOP 45 | seq[i].append(STOP) 46 | 47 | obs = Variable(torch.FloatTensor(obs)) 48 | tgt = Variable(torch.LongTensor(tgt)) 49 | return Batch(seq, seq, obs, obs, tgt) 50 | 51 | class Decoder(nn.Module): 52 | def __init__(self): 53 | emb = N_EMBED 54 | hid = N_HIDDEN 55 | super().__init__() 56 | self._embed = nn.Linear(FULL_VOCAB_SIZE, emb) 57 | self._rnn = nn.GRU(input_size=emb, hidden_size=hid, num_layers=1) 58 | self._predict = nn.Linear(hid, FULL_VOCAB_SIZE) 59 | self._softmax = nn.Softmax(dim=1) 60 | 61 | def forward(self, state, inp): 62 | emb = self._embed(inp) 63 | rep, enc = self._rnn(emb, state) 64 | logits = self._predict(rep) 65 | return enc, logits 66 | 67 | def decode(self, init_state, max_len, sample=False): 68 | n_stack, n_batch, _ = init_state.shape 69 | out = [[START] for _ in range(n_batch)] 70 | tok_inp = [START for _ in range(n_batch)] 71 | done = [False for _ in range(n_batch)] 72 | state = init_state 73 | for _ in range(max_len): 74 | hot_inp = np.zeros((1, n_batch, FULL_VOCAB_SIZE)) 75 | for i, t in enumerate(tok_inp): 76 | hot_inp[0, i, t] = 1 77 | hot_inp = Variable(torch.FloatTensor(hot_inp)) 78 | if init_state.is_cuda: 79 | hot_inp = hot_inp.cuda() 80 | new_state, label_logits = self(state, hot_inp) 81 | label_logits = label_logits.squeeze(0) 82 | label_probs = unwrap(self._softmax(label_logits)) 83 | new_tok_inp = [] 84 | for i, row in enumerate(label_probs): 85 | if sample: 86 | tok = np.random.choice(row.size, p=row) 87 | else: 88 | tok = row.argmax() 89 | new_tok_inp.append(tok) 90 | if not done[i]: 91 | out[i].append(tok) 92 | done[i] = done[i] or tok == STOP 93 | state = new_state 94 | tok_inp = new_tok_inp 95 | if all(done): 96 | break 97 | return out 98 | 99 | class Encoder(nn.Module): 100 | def __init__(self): 101 | super().__init__() 102 | self._embed = nn.Linear(FULL_VOCAB_SIZE, N_EMBED) 103 | self._rnn = nn.GRU(input_size=N_EMBED, hidden_size=N_HIDDEN, num_layers=1) 104 | 105 | def forward(self, obs): 106 | emb = self._embed(obs) 107 | _, enc = self._rnn(emb) 108 | return enc 109 | 110 | class Model(nn.Module): 111 | def __init__(self): 112 | super().__init__() 113 | self.encoder = Encoder() 114 | self.decoder = Decoder() 115 | self.loss = nn.CrossEntropyLoss() 116 | 117 | def forward(self, batch): 118 | enc = self.encoder(batch.e_obs) 119 | _, dec = self.decoder(enc, batch.f_obs) 120 | size_l, size_n, size_v = dec.shape 121 | dec = dec.view(size_l * size_n, size_v) 122 | tgt = batch.f_tgt.view(size_l * size_n) 123 | loss = self.loss(dec, tgt) 124 | return loss 125 | 126 | def decode(self, batch): 127 | enc = self.encoder(batch.e_obs) 128 | dec = self.decoder.decode(enc, MAX_LEN) 129 | return dec 130 | 131 | def validate(model, batch): 132 | pred = model.decode(batch) 133 | score = 0 134 | count = 0 135 | for i, (f, pf) in enumerate(zip(batch.f_seq, pred)): 136 | score += int(f == pf) 137 | count += 1 138 | if i < 3: 139 | print(f[1:-1]) 140 | print(pf[1:-1]) 141 | print() 142 | print(1. * score / count) 143 | print() 144 | 145 | def main(): 146 | model = Model() 147 | opt = optim.Adam(model.parameters(), 1e-3) 148 | for i in range(100): 149 | l = 0. 150 | for j in range(10): 151 | batch = sample_copy(100) 152 | loss = model(batch) 153 | opt.zero_grad() 154 | loss.backward() 155 | opt.step() 156 | ll, = unwrap(loss) 157 | l += ll 158 | 159 | print(l) 160 | validate(model, sample_copy(100)) 161 | validate(model, sample_copy(100, test=True)) 162 | print() 163 | 164 | 165 | main() 166 | -------------------------------------------------------------------------------- /metacomp.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python3 2 | 3 | from grammar import GrammarBuilder 4 | import hlog 5 | from seq import Encoder, SimpleDecoder, AttDecoder 6 | from vocab import Vocab 7 | 8 | import numpy as np 9 | import torch 10 | from torch import nn, optim 11 | import torch.utils.data as torch_data 12 | 13 | DEVICE=torch.device('cuda:0') 14 | 15 | BATCH_LANGS = 50 16 | BATCH_EXAMPLES = 5 17 | N_NT = 5 18 | N_T = 10 19 | N_NT_RULES = 20 20 | N_T_RULES = 5 21 | 22 | N_EMB = 64 23 | N_HID = 512 24 | N_LAYERS = 1 25 | 26 | START = '<' 27 | MID = '|' 28 | END = '>' 29 | 30 | class Dataset(torch_data.Dataset): 31 | def __init__(self): 32 | self._gb = GrammarBuilder() 33 | self.vocab = Vocab() 34 | self.start = self.vocab.add(START) 35 | self.mid = self.vocab.add(MID) 36 | self.end = self.vocab.add(END) 37 | for s in self._gb.symbols(N_T): 38 | self.vocab.add(s) 39 | 40 | def __len__(self): 41 | return 10 * BATCH_LANGS 42 | 43 | def __getitem__(self, i): 44 | grammar = self._gb.sample(N_NT, N_T, N_NT_RULES, N_T_RULES) 45 | samples = list(set(grammar.sample() for _ in range(2 * BATCH_EXAMPLES))) 46 | samples = [ 47 | (self.vocab.encode(e), self.vocab.encode(f)) 48 | for e, f in samples 49 | ] 50 | if len(samples) == 1: 51 | samples = samples + samples 52 | samp_in = samples[1:BATCH_EXAMPLES+1] 53 | samp_out = samples[0] 54 | while len(samp_in) < BATCH_EXAMPLES: 55 | samp_in += samples[1:BATCH_EXAMPLES-len(samp_in)+1] 56 | 57 | in_stacked = [] 58 | for e, f in samp_in: 59 | in_stacked += ( 60 | [self.start] + list(e) + [self.mid] + list(f) + [self.end] 61 | ) 62 | out_e, out_f = samp_out 63 | 64 | return in_stacked, out_e, out_f 65 | 66 | def collate(self, samples): 67 | n_batch = len(samples) 68 | pad = self.vocab.pad() 69 | ex, out_e, out_f = zip(*samples) 70 | 71 | ex_data = np.full( 72 | (n_batch, max(len(e) for e in ex)), 73 | pad, 74 | dtype=np.int64 75 | ) 76 | out_e_data = np.full( 77 | (n_batch, max(len(o) for o in out_e)), 78 | pad, 79 | dtype=np.int64 80 | ) 81 | out_f_data = np.full( 82 | (n_batch, max(len(o) for o in out_f)), 83 | pad, 84 | dtype=np.int64 85 | ) 86 | 87 | for i in range(n_batch): 88 | ex_data[i, :len(ex[i])] = ex[i] 89 | out_e_data[i, :len(out_e[i])] = out_e[i] 90 | out_f_data[i, :len(out_f[i])] = out_f[i] 91 | 92 | return ( 93 | torch.tensor(ex_data).to(DEVICE), 94 | torch.tensor(out_e_data).to(DEVICE), 95 | torch.tensor(out_f_data).to(DEVICE), 96 | [self.vocab.decode(o[1:-1]) for o in out_f] 97 | ) 98 | 99 | class Model(nn.Module): 100 | def __init__(self, dataset, n_embed, n_hidden, n_layers): 101 | super().__init__() 102 | self.ex_encoder = Encoder(dataset.vocab, n_embed, n_hidden, n_layers) 103 | self.out_encoder = Encoder(dataset.vocab, n_embed, n_hidden, n_layers) 104 | self.out_decoder = SimpleDecoder(dataset.vocab, n_embed, n_hidden, n_layers) 105 | 106 | def _encode(self, ex, out_e): 107 | enc_ex, state_ex = self.ex_encoder(ex) 108 | enc_out, state_out = self.out_encoder(out_e) 109 | 110 | # TODO 111 | state_h = (state_ex[0] + state_out[0]).sum(dim=0, keepdim=True) 112 | state_c = (state_ex[1] + state_out[1]).sum(dim=0, keepdim=True) 113 | 114 | return enc_out, (state_h, state_c) 115 | 116 | def forward(self, ex, out_e, out_f): 117 | context, state = self._encode(ex, out_e) 118 | dec, _ = self.out_decoder(context, out_f, state) 119 | return dec 120 | 121 | def decode(self, ex, out_e): 122 | context, state = self._encode(ex, out_e) 123 | return self.out_decoder.decode(context, state, DEVICE) 124 | 125 | class Trainer(object): 126 | def __init__(self, dataset, model): 127 | model.to(DEVICE) 128 | objective = nn.CrossEntropyLoss(ignore_index=dataset.vocab.pad()).to(DEVICE) 129 | self.dataset = dataset 130 | self.model = model 131 | self.objective = objective 132 | 133 | @hlog.fn('train') 134 | def train(self): 135 | opt = optim.Adam(model.parameters(), lr=0.002) 136 | sched = optim.lr_scheduler.ReduceLROnPlateau( 137 | opt, 138 | factor=0.5, 139 | verbose=True 140 | ) 141 | loader = torch_data.DataLoader(dataset, BATCH_LANGS, collate_fn=dataset.collate) 142 | for i_epoch in hlog.loop('epoch_%03d', counter=range(1000)): 143 | epoch_loss = 0 144 | for ex, out_e, out_f, _ in loader: 145 | n_tgts = BATCH_LANGS * (out_f.shape[1] - 1) 146 | pred = self.model.forward(ex, out_e, out_f)[:, :-1, :] 147 | pred = pred.contiguous().view(n_tgts, len(self.dataset.vocab)) 148 | tgt = out_f[:, 1:].contiguous().view(n_tgts) 149 | loss = self.objective(pred, tgt) 150 | opt.zero_grad() 151 | loss.backward() 152 | opt.step() 153 | 154 | epoch_loss += float(loss) 155 | 156 | #dec = self.model.decode(ex, out_e) 157 | #print(dec) 158 | 159 | hlog.value('loss', epoch_loss) 160 | sched.step(epoch_loss) 161 | 162 | for ex, out_e, out_f, pp_f in loader: 163 | dec = self.model.decode(ex, out_e) 164 | dec = [self.dataset.vocab.decode(d) for d in dec] 165 | for d, p in list(zip(dec, pp_f))[:5]: 166 | hlog.value('ex', '%s %s' % (d, p)) 167 | break 168 | 169 | dataset = Dataset() 170 | model = Model(dataset, N_EMB, N_HID, N_LAYERS) 171 | trainer = Trainer(dataset, model) 172 | trainer.train() 173 | -------------------------------------------------------------------------------- /cp.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python3 2 | 3 | import hlog 4 | from seq import Encoder, SimpleDecoder, AttDecoder 5 | from vocab import Vocab 6 | 7 | from collections import defaultdict, namedtuple 8 | import numpy as np 9 | from scipy import stats 10 | import torch 11 | from torch import nn, optim 12 | import torch.utils.data as torch_data 13 | 14 | DEVICE=torch.device('cuda:0') 15 | 16 | N_SYMS = 5 17 | N_EMB = 64 18 | N_HID = 512 19 | N_LAYERS = 1 20 | 21 | BATCH_SIZE = 64 22 | #TRAIN_LENS = list(range(1, 10)) 23 | #VAL_LENS = list(range(1, 10)) 24 | TRAIN_LENS = [3, 4, 5, 6, 12, 13] 25 | VAL_LENS = [7, 8, 9, 10, 11] 26 | 27 | 28 | class Dataset(torch_data.Dataset): 29 | def __init__(self, val=False): 30 | self.vocab = Vocab() 31 | self.syms = [chr(ord('a') + i) for i in range(N_SYMS)] 32 | for s in self.syms: 33 | self.vocab.add(s) 34 | self.val = val 35 | 36 | def __len__(self): 37 | return 10 * BATCH_SIZE 38 | 39 | def __getitem__(self, i): 40 | if self.val: 41 | seq_len = np.random.choice(VAL_LENS) 42 | else: 43 | seq_len = np.random.choice(TRAIN_LENS) 44 | seq = [np.random.choice(self.syms) for _ in range(seq_len)] 45 | return self.vocab.encode(seq) 46 | 47 | def collate(self, seqs): 48 | n_batch = len(seqs) 49 | pad = self.vocab.pad() 50 | data = np.full((n_batch, max(len(s) for s in seqs)), pad, dtype=np.int64) 51 | for i in range(n_batch): 52 | data[i, :len(seqs[i])] = seqs[i] 53 | return [s[1:-1] for s in seqs], torch.tensor(data).to(DEVICE) 54 | 55 | class Model(nn.Module): 56 | def __init__(self, dataset, n_embed, n_hidden, n_layers): 57 | super().__init__() 58 | self.encoder = Encoder(dataset.vocab, n_embed, n_hidden, n_layers, 59 | bidirectional=False) 60 | self.decoder = AttDecoder(dataset.vocab, n_embed, n_hidden, n_hidden, n_layers) 61 | 62 | def forward(self, data): 63 | context, state = self.encoder(data) 64 | pred, _ = self.decoder(context, data, state) 65 | return pred 66 | 67 | def decode(self, data): 68 | context, state = self.encoder(data) 69 | dec, hiddens = self.decoder.decode(context, state, DEVICE) 70 | return dec, hiddens 71 | 72 | #ActInfo = namedtuple('ActInfo', 'index seq counter completion') 73 | 74 | def counter_fn(sign=1, normalize=None): 75 | def analyze(seq): 76 | if normalize == 'first': 77 | offset = seq[0] 78 | elif normalize == 'last': 79 | offset = seq[-1] 80 | seq = list(reversed(seq)) 81 | else: 82 | offset = 0 83 | seq = [sign * (a - offset) for a in seq] 84 | indices = list(range(len(seq))) 85 | return indices, seq 86 | return analyze 87 | 88 | def length_fn(sign=1): 89 | def analyze(seq): 90 | return [sign * len(seq)], [seq[0]] 91 | return analyze 92 | 93 | ANALYZERS = { 94 | 'count+': counter_fn(), 95 | 'count-': counter_fn(sign=-1), 96 | 'count+f': counter_fn(normalize='first'), 97 | 'count-l': counter_fn(sign=-1, normalize='last'), 98 | 'len+': length_fn(), 99 | 'len-': length_fn(sign=-1) 100 | } 101 | 102 | def analyze(hiddens): 103 | n_a = N_HID * N_LAYERS 104 | 105 | ana_data = {k: defaultdict(lambda: ([], [])) for k in ANALYZERS} 106 | 107 | for i in range(len(hiddens)): 108 | t = torch.stack(hiddens[i]).view(-1, n_a).t() 109 | for i_a in range(n_a): 110 | seq = t[i_a, :].detach().cpu().numpy().tolist() 111 | for name, ana in ANALYZERS.items(): 112 | x, y = ana(seq) 113 | xs, ys = ana_data[name][i_a] 114 | xs += x 115 | ys += y 116 | 117 | for name in ANALYZERS: 118 | scores = {i_a: stats.pearsonr(*ana_data[name][i_a]) for i_a in range(n_a)} 119 | i_a = max(scores, key=lambda i: scores[i][0]) 120 | print(name) 121 | print(scores[i_a]) 122 | for hseq in hiddens[:10]: 123 | t = torch.stack(hseq).view(-1, n_a).t() 124 | seq = t[i_a, :].detach().cpu().numpy().tolist() 125 | print(' '.join('%0.2f' % ss for ss in seq)) 126 | print() 127 | 128 | 129 | #i_counter, counter_score = min(scores.items(), key=lambda x: x[1]) 130 | #print(i_counter, counter_score) 131 | #print(max(scores.items(), key=lambda x: x[1])) 132 | #for hseq in hiddens: 133 | # t = torch.stack(hseq).view(-1, n_a).t() 134 | # s = t[i_counter, :].detach().cpu().numpy().tolist() 135 | # print(' '.join('%0.3f' % ss for ss in s)) 136 | # increments = [s[i] - s[i-1] for i in range(1, len(s))] 137 | # print(' '.join('%0.3f' % ss for ss in increments)) 138 | # print() 139 | ##print(seq_data[i_counter]) 140 | #print(counter_score) 141 | #print() 142 | 143 | #print(max(comp_scores.items(), key=lambda x: x[1])) 144 | #print(min(count_scores.items(), key=lambda x: x[1])) 145 | #print(min(comp_scores.items(), key=lambda x: x[1])) 146 | 147 | dataset = Dataset() 148 | val_dataset = Dataset(val=True) 149 | model = Model(dataset, N_EMB, N_HID, N_LAYERS).to(DEVICE) 150 | loader = torch_data.DataLoader(dataset, BATCH_SIZE, collate_fn=dataset.collate) 151 | val_loader = torch_data.DataLoader(val_dataset, BATCH_SIZE, collate_fn=dataset.collate) 152 | 153 | obj = nn.CrossEntropyLoss(ignore_index=dataset.vocab.pad()).to(DEVICE) 154 | opt = optim.Adam(model.parameters(), lr=0.001) 155 | #sched = optim.lr_scheduler.ReduceLROnPlateau( 156 | # opt, factor=0.5, verbose=True 157 | #) 158 | sched = optim.lr_scheduler.StepLR( 159 | opt, step_size=10, gamma=0.1 160 | ) 161 | for i_epoch in hlog.loop('%03d', counter=range(30)): 162 | epoch_loss = 0 163 | epoch_acc = 0 164 | epoch_count = 0 165 | for seqs, data in loader: 166 | n_tgts = data.shape[0] * (data.shape[1] - 1) 167 | pred = model(data)[:, :-1, :] 168 | pred = pred.contiguous().view(n_tgts, len(dataset.vocab)) 169 | tgt = data[:, 1:].contiguous().view(n_tgts) 170 | loss = obj(pred, tgt) 171 | opt.zero_grad() 172 | loss.backward() 173 | opt.step() 174 | epoch_loss += float(loss) 175 | 176 | dec, hiddens = model.decode(data) 177 | acc = np.mean([d == s for d, s in zip(dec, seqs)]) 178 | epoch_acc += acc 179 | epoch_count += 1 180 | 181 | analyze(hiddens) 182 | 183 | val_acc = 0 184 | val_count = 0 185 | for seqs, data in val_loader: 186 | dec, hiddens = model.decode(data) 187 | acc = np.mean([d == s for d, s in zip(dec, seqs)]) 188 | val_acc += acc 189 | val_count += 1 190 | 191 | hlog.value('loss', epoch_loss / epoch_count) 192 | hlog.value('acc', epoch_acc / epoch_count) 193 | hlog.value('vacc', val_acc / val_count) 194 | #sched.step(epoch_loss) 195 | sched.step() 196 | -------------------------------------------------------------------------------- /exp/test/run_noatt.out: -------------------------------------------------------------------------------- 1 | train/epoch_000/loss 21.8896 2 | train/epoch_000/ex iii bc 3 | train/epoch_000/ex hhhhhhhhhhh eeef 4 | train/epoch_000/ex iii gb 5 | train/epoch_000/ex bbbbbbbbbbbbbbbbbbbb cccccccc 6 | train/epoch_000/ex hhhhhhhhhhhh aaa 7 | train/epoch_000{1.30s} 8 | train/epoch_001/loss 16.8406 9 | train/epoch_001/ex jjjjjjjjj hhhhh 10 | train/epoch_001/ex iiiiiiiiiiiiiiiiiiii hh 11 | train/epoch_001/ex jjjjjjj iii 12 | train/epoch_001/ex jjjjjjjj ddd 13 | train/epoch_001/ex jjjjjjjj iiie 14 | train/epoch_001{1.30s} 15 | train/epoch_002/loss 15.1637 16 | train/epoch_002/ex iiiiiiii ffcciffe 17 | train/epoch_002/ex a d 18 | train/epoch_002/ex j ib 19 | train/epoch_002/ex fffffff djjddj 20 | train/epoch_002/ex iii dcc 21 | train/epoch_002{1.30s} 22 | train/epoch_003/loss 13.7067 23 | train/epoch_003/ex ddddddd fffcfcff 24 | train/epoch_003/ex ggg hbg 25 | train/epoch_003/ex dddddd hhhhhh 26 | train/epoch_003/ex a f 27 | train/epoch_003/ex dddd ffff 28 | train/epoch_003{1.25s} 29 | train/epoch_004/loss 13.5993 30 | train/epoch_004/ex ffff eii 31 | train/epoch_004/ex bbb di 32 | train/epoch_004/ex fffff eeed 33 | train/epoch_004/ex jjjjjjjj iiiiiii 34 | train/epoch_004/ex ff db 35 | train/epoch_004{1.29s} 36 | train/epoch_005/loss 13.3177 37 | train/epoch_005/ex hhhh fffff 38 | train/epoch_005/ex i d 39 | train/epoch_005/ex gg ddi 40 | train/epoch_005/ex d g 41 | train/epoch_005/ex gg ei 42 | train/epoch_005{1.25s} 43 | train/epoch_006/loss 13.0066 44 | train/epoch_006/ex aa bb 45 | train/epoch_006/ex ddddd hhhhh 46 | train/epoch_006/ex hhhhhh fffff 47 | train/epoch_006/ex ddddd gbibc 48 | train/epoch_006/ex bbb ccb 49 | train/epoch_006{1.28s} 50 | train/epoch_007/loss 12.3043 51 | train/epoch_007/ex d e 52 | train/epoch_007/ex d d 53 | train/epoch_007/ex hhh eef 54 | train/epoch_007/ex hhh ddd 55 | train/epoch_007/ex dd gb 56 | train/epoch_007{1.25s} 57 | train/epoch_008/loss 12.6044 58 | train/epoch_008/ex eeeee fffff 59 | train/epoch_008/ex eeeeee dddddd 60 | train/epoch_008/ex iiiiiiiii ieiiieeii 61 | train/epoch_008/ex ii ih 62 | train/epoch_008/ex ii gi 63 | train/epoch_008{1.29s} 64 | train/epoch_009/loss 12.4201 65 | train/epoch_009/ex aaaa eaee 66 | train/epoch_009/ex cc if 67 | train/epoch_009/ex ccc ddd 68 | train/epoch_009/ex aaa gge 69 | train/epoch_009/ex iiiiii eeeeee 70 | train/epoch_009{1.25s} 71 | train/epoch_010/loss 12.1638 72 | train/epoch_010/ex aa jj 73 | train/epoch_010/ex iiiiiii ggggggg 74 | train/epoch_010/ex cc ee 75 | train/epoch_010/ex dddddd gggggg 76 | train/epoch_010/ex i i 77 | train/epoch_010{1.29s} 78 | train/epoch_011/loss 12.1983 79 | train/epoch_011/ex i i 80 | train/epoch_011/ex f c 81 | train/epoch_011/ex f a 82 | train/epoch_011/ex ddd jjg 83 | train/epoch_011/ex ddddddd bbbbbbb 84 | train/epoch_011{1.26s} 85 | train/epoch_012/loss 12.1329 86 | train/epoch_012/ex jjjjj hhhhh 87 | train/epoch_012/ex bbbbb ieeee 88 | train/epoch_012/ex bbbbbb gggggg 89 | train/epoch_012/ex bbbb bbcf 90 | train/epoch_012/ex d h 91 | train/epoch_012{1.25s} 92 | train/epoch_013/loss 11.7830 93 | train/epoch_013/ex ffffff gggggg 94 | train/epoch_013/ex bb jb 95 | train/epoch_013/ex d d 96 | train/epoch_013/ex i d 97 | train/epoch_013/ex iiii fffe 98 | train/epoch_013{1.28s} 99 | train/epoch_014/loss 11.6701 100 | train/epoch_014/ex jjjjjjjj jjjjjjjj 101 | train/epoch_014/ex a a 102 | train/epoch_014/ex hhhhh ggggg 103 | train/epoch_014/ex a b 104 | train/epoch_014/ex a d 105 | train/epoch_014{1.28s} 106 | train/epoch_015/loss 11.8334 107 | train/epoch_015/ex cccc fjji 108 | train/epoch_015/ex cccccc cccccc 109 | train/epoch_015/ex hhhh fiff 110 | train/epoch_015/ex hhhh iiie 111 | train/epoch_015/ex ddddd ccccc 112 | train/epoch_015{1.27s} 113 | train/epoch_016/loss 11.5445 114 | train/epoch_016/ex ddd dda 115 | train/epoch_016/ex bb fj 116 | train/epoch_016/ex dddddd eeeeee 117 | train/epoch_016/ex ggg ggj 118 | train/epoch_016/ex j g 119 | train/epoch_016{1.29s} 120 | train/epoch_017/loss 11.4088 121 | train/epoch_017/ex bbbb aaja 122 | train/epoch_017/ex bbbb ddcd 123 | train/epoch_017/ex gggg gggb 124 | train/epoch_017/ex gggggg bbgggg 125 | train/epoch_017/ex bbbbb bbbbb 126 | train/epoch_017{1.27s} 127 | train/epoch_018/loss 11.5917 128 | train/epoch_018/ex eeeee hbbbb 129 | train/epoch_018/ex f j 130 | train/epoch_018/ex ggg bgb 131 | train/epoch_018/ex eeeeee cccjcj 132 | train/epoch_018/ex ggggggg ggggggi 133 | train/epoch_018{1.25s} 134 | train/epoch_019/loss 11.9625 135 | train/epoch_019/ex ddddddd bbbbbbb 136 | train/epoch_019/ex hhhhh jjajj 137 | train/epoch_019/ex gggg gggg 138 | train/epoch_019/ex gggggg gggggg 139 | train/epoch_019/ex ggggg geegg 140 | train/epoch_019{1.28s} 141 | train/epoch_020/loss 11.3669 142 | train/epoch_020/ex gg fh 143 | train/epoch_020/ex ggggg ciiid 144 | train/epoch_020/ex eeeee djjjj 145 | train/epoch_020/ex gggg heeh 146 | train/epoch_020/ex b a 147 | train/epoch_020{1.27s} 148 | train/epoch_021/loss 11.9595 149 | train/epoch_021/ex aaa iii 150 | train/epoch_021/ex aaaa iiff 151 | train/epoch_021/ex gggg fiid 152 | train/epoch_021/ex aa ff 153 | train/epoch_021/ex aaa fff 154 | train/epoch_021{1.29s} 155 | train/epoch_022/loss 11.5341 156 | train/epoch_022/ex dddddd fffdff 157 | train/epoch_022/ex bbbbb ccccc 158 | train/epoch_022/ex i e 159 | train/epoch_022/ex iii hhc 160 | train/epoch_022/ex iiiiii gggggg 161 | train/epoch_022{1.26s} 162 | train/epoch_023/loss 11.5181 163 | train/epoch_023/ex dddddd dddddd 164 | train/epoch_023/ex jjjjjjjj ffffffff 165 | train/epoch_023/ex bbbbbbb eeeeeee 166 | train/epoch_023/ex jj jj 167 | train/epoch_023/ex ddddddd eeeeeae 168 | train/epoch_023{1.27s} 169 | train/epoch_024/loss 11.5087 170 | train/epoch_024/ex jj ia 171 | train/epoch_024/ex ccc fac 172 | train/epoch_024/ex ccccc diidi 173 | train/epoch_024/ex eeeee biiii 174 | train/epoch_024/ex cc af 175 | train/epoch_024{1.27s} 176 | train/epoch_025/loss 11.4661 177 | train/epoch_025/ex cccc biii 178 | train/epoch_025/ex jj ag 179 | train/epoch_025/ex jjj bij 180 | train/epoch_025/ex cccc dcdd 181 | train/epoch_025/ex j f 182 | train/epoch_025{1.26s} 183 | train/epoch_026/loss 11.7014 184 | train/epoch_026/ex aaa aaa 185 | train/epoch_026/ex ccc dfd 186 | train/epoch_026/ex iiii aaaj 187 | train/epoch_026/ex jj bc 188 | train/epoch_026/ex hhh hhh 189 | train/epoch_026{1.27s} 190 | train/epoch_027/loss 11.6740 191 | train/epoch_027/ex jj jd 192 | train/epoch_027/ex ccc ddd 193 | train/epoch_027/ex c i 194 | train/epoch_027/ex eeeeee abiiii 195 | train/epoch_027/ex gg ja 196 | train/epoch_027{1.26s} 197 | train/epoch_028/loss 11.0693 198 | train/epoch_028/ex ggg fff 199 | train/epoch_028/ex bbbb gggg 200 | train/epoch_028/ex bbbb ccgg 201 | train/epoch_028/ex gggg bddd 202 | train/epoch_028/ex gggg dede 203 | train/epoch_028{1.27s} 204 | train/epoch_029/loss 10.9515 205 | train/epoch_029/ex jjjj bbbb 206 | train/epoch_029/ex cc gh 207 | train/epoch_029/ex j j 208 | train/epoch_029/ex e j 209 | train/epoch_029/ex d d 210 | train/epoch_029{1.29s} 211 | train/epoch_030/loss 11.0099 212 | train/epoch_030/ex g g 213 | train/epoch_030/ex gggg faff 214 | train/epoch_030/ex cccccccc cccccccc 215 | train/epoch_030/ex ccc jjb 216 | train/epoch_030/ex b i 217 | train/epoch_030{1.24s} 218 | train/epoch_031/loss 11.0173 219 | train/epoch_031/ex iiiiiii hjhjhjh 220 | train/epoch_031/ex jjjjjjjj iiiiieii 221 | train/epoch_031/ex gggg hhhh 222 | train/epoch_031/ex j j 223 | train/epoch_031/ex hh ha 224 | train/epoch_031{1.28s} 225 | train/epoch_032/loss 10.9600 226 | train/epoch_032/ex jj dd 227 | train/epoch_032/ex hhhhhh ggaaga 228 | train/epoch_032/ex f d 229 | train/epoch_032/ex gggggg jjjjjj 230 | train/epoch_032/ex jjjjjjjj ffffffff 231 | train/epoch_032{1.26s} 232 | train/epoch_033/loss 11.4437 233 | train/epoch_033/ex hhhh cccc 234 | train/epoch_033/ex eeeee iafaf 235 | train/epoch_033/ex iii eda 236 | train/epoch_033/ex eeeeeee hhhhfff 237 | train/epoch_033/ex jj dh 238 | train/epoch_033{1.26s} 239 | train/epoch_034/loss 10.8139 240 | train/epoch_034/ex ddd aaa 241 | train/epoch_034/ex f g 242 | train/epoch_034/ex dddd gggf 243 | train/epoch_034/ex hhh hhh 244 | train/epoch_034/ex gggggggg gggggggg 245 | train/epoch_034{1.26s} 246 | train/epoch_035/loss 10.4774 247 | train/epoch_035/ex jjjjjj bhhhgb 248 | train/epoch_035/ex g a 249 | train/epoch_035/ex g j 250 | train/epoch_035/ex aaaaaaa ggggggg 251 | train/epoch_035/ex eeeeeeeee ccccccccc 252 | train/epoch_035{1.26s} 253 | train/epoch_036/loss 10.6643 254 | train/epoch_036/ex aaaa ddde 255 | train/epoch_036/ex j j 256 | train/epoch_036/ex eeeeeeee eeeeeeee 257 | train/epoch_036/ex jjj aig 258 | train/epoch_036/ex e h 259 | train/epoch_036{1.27s} 260 | train/epoch_037/loss 10.8361 261 | train/epoch_037/ex h g 262 | train/epoch_037/ex gggg baaa 263 | train/epoch_037/ex g c 264 | train/epoch_037/ex jj jj 265 | train/epoch_037/ex bbbb ggge 266 | train/epoch_037{1.27s} 267 | train/epoch_038/loss 9.9229 268 | train/epoch_038/ex ccc aaa 269 | train/epoch_038/ex hhhh ifff 270 | train/epoch_038/ex gggggg hhfggh 271 | train/epoch_038/ex ggg hgg 272 | train/epoch_038/ex hhhhh ghggh 273 | train/epoch_038{1.25s} 274 | train/epoch_039/loss 10.6858 275 | train/epoch_039/ex ggggg fffff 276 | train/epoch_039/ex hhhhhhhhh bbbbhbbbb 277 | train/epoch_039/ex ddd jhh 278 | train/epoch_039/ex ddd fii 279 | train/epoch_039/ex jjj hhh 280 | train/epoch_039{1.30s} 281 | train/epoch_040/loss 10.2436 282 | train/epoch_040/ex fffff fcffh 283 | train/epoch_040/ex ff ef 284 | train/epoch_040/ex aaa gii 285 | train/epoch_040/ex ffffffff ffffffff 286 | train/epoch_040/ex aaaa gicc 287 | train/epoch_040{1.25s} 288 | train/epoch_041/loss 9.9133 289 | train/epoch_041/ex d c 290 | train/epoch_041/ex jjjjj didii 291 | train/epoch_041/ex ggg ggg 292 | train/epoch_041/ex ffff fffc 293 | train/epoch_041/ex gggggg bbbbbi 294 | train/epoch_041{1.24s} 295 | train/epoch_042/loss 9.8541 296 | train/epoch_042/ex bbbbb ejeff 297 | train/epoch_042/ex jjjjj fjjjj 298 | train/epoch_042/ex h d 299 | train/epoch_042/ex gggggggg bbbbbbbf 300 | train/epoch_042/ex ggg hhh 301 | train/epoch_042{1.24s} 302 | train/epoch_043/loss 10.1383 303 | train/epoch_043/ex i j 304 | train/epoch_043/ex ggggg gghgg 305 | train/epoch_043/ex gggggg ggggfg 306 | train/epoch_043/ex e e 307 | train/epoch_043/ex jd jf 308 | train/epoch_043{1.27s} 309 | train/epoch_044/loss 9.5657 310 | train/epoch_044/ex h d 311 | train/epoch_044/ex bbb ccb 312 | train/epoch_044/ex e e 313 | train/epoch_044/ex g b 314 | train/epoch_044/ex bf fd 315 | train/epoch_044{1.27s} 316 | train/epoch_045/loss 9.1681 317 | train/epoch_045/ex jjjj bjbb 318 | train/epoch_045/ex h h 319 | train/epoch_045/ex ddd dee 320 | train/epoch_045/ex aaaa aaaa 321 | train/epoch_045/ex jjj hha 322 | train/epoch_045{1.28s} 323 | train/epoch_046/loss 9.6376 324 | train/epoch_046/ex hhh che 325 | train/epoch_046/ex i j 326 | train/epoch_046/ex ffffffff ffffffff 327 | train/epoch_046/ex d b 328 | train/epoch_046/ex eeee aeee 329 | train/epoch_046{1.25s} 330 | train/epoch_047/loss 8.4740 331 | train/epoch_047/ex bb ff 332 | train/epoch_047/ex iiiii iiiii 333 | train/epoch_047/ex aaa aja 334 | train/epoch_047/ex ddd ddi 335 | train/epoch_047/ex gggggg gggggg 336 | train/epoch_047{1.25s} 337 | train/epoch_048/loss 8.4864 338 | train/epoch_048/ex iii iii 339 | train/epoch_048/ex ccc hhh 340 | train/epoch_048/ex bbb aai 341 | train/epoch_048/ex c h 342 | train/epoch_048/ex dddddd cccccc 343 | train/epoch_048{1.29s} 344 | train/epoch_049/loss 8.3088 345 | train/epoch_049/ex bbbbbb gbghbb 346 | train/epoch_049/ex bbbbbbbb bbbbbbbb 347 | train/epoch_049/ex ggg gcb 348 | train/epoch_049/ex ccccccc iiccccc 349 | train/epoch_049/ex aaaa eaee 350 | train/epoch_049{1.25s} 351 | train/epoch_050/loss 8.4498 352 | train/epoch_050/ex aaaa aaac 353 | train/epoch_050/ex hhhhhhhhhhh fiihffihfiff 354 | train/epoch_050/ex c a 355 | train/epoch_050/ex fffff fbfff 356 | train/epoch_050/ex ffff fbff 357 | train/epoch_050{1.28s} 358 | train/epoch_051/loss 7.9924 359 | train/epoch_051/ex eeeeeee eeeeeee 360 | train/epoch_051/ex gg gc 361 | train/epoch_051/ex hhhh hhhh 362 | train/epoch_051/ex jjjjj jjjfj 363 | train/epoch_051/ex jjjjj jjjjj 364 | train/epoch_051{1.28s} 365 | train/epoch_052/loss 7.5025 366 | train/epoch_052/ex h b 367 | train/epoch_052/ex hh ha 368 | train/epoch_052/ex h h 369 | train/epoch_052/ex ccb ccb 370 | train/epoch_052/ex iie ege 371 | train/epoch_052{1.26s} 372 | train/epoch_053/loss 7.8173 373 | train/epoch_053/ex ib hg 374 | train/epoch_053/ex h a 375 | train/epoch_053/ex dji idi 376 | train/epoch_053/ex cccccc cccccc 377 | train/epoch_053/ex aaaa hdaa 378 | train/epoch_053{1.28s} 379 | train/epoch_054/loss 7.5550 380 | train/epoch_054/ex ddd dcc 381 | train/epoch_054/ex bbb jjj 382 | train/epoch_054/ex hhhhhhh hhhhhhh 383 | train/epoch_054/ex bbb bbb 384 | train/epoch_054/ex ddd ddd 385 | train/epoch_054{1.27s} 386 | train/epoch_055/loss 7.6156 387 | train/epoch_055/ex hhhhh chhhh 388 | train/epoch_055/ex jj ii 389 | train/epoch_055/ex ddddd deedd 390 | train/epoch_055/ex dddd dddd 391 | train/epoch_055/ex hhh feb 392 | train/epoch_055{1.26s} 393 | train/epoch_056/loss 7.2569 394 | train/epoch_056/ex jj ff 395 | train/epoch_056/ex h j 396 | train/epoch_056/ex g b 397 | train/epoch_056/ex jjjj fjjj 398 | train/epoch_056/ex aaabb abbba 399 | train/epoch_056{1.29s} 400 | train/epoch_057/loss 7.1361 401 | train/epoch_057/ex ccccc ccccc 402 | train/epoch_057/ex if ai 403 | train/epoch_057/ex iiiiii eiiiii 404 | train/epoch_057/ex gggggg bbgbbb 405 | train/epoch_057/ex ghg hgh 406 | train/epoch_057{1.25s} 407 | train/epoch_058/loss 7.0003 408 | train/epoch_058/ex aaaaaaa ggggaag 409 | train/epoch_058/ex eeeeee eeeeee 410 | train/epoch_058/ex aaaaaa ccacca 411 | train/epoch_058/ex hf hf 412 | train/epoch_058/ex d d 413 | train/epoch_058{1.29s} 414 | train/epoch_059/loss 7.1866 415 | train/epoch_059/ex aaaaa aadaa 416 | train/epoch_059/ex cccccf ffcfac 417 | train/epoch_059/ex bbb bba 418 | train/epoch_059/ex aa ah 419 | train/epoch_059/ex fff fff 420 | train/epoch_059{1.28s} 421 | train/epoch_060/loss 6.9411 422 | train/epoch_060/ex jjjjjjjj jjjjaaac 423 | train/epoch_060/ex fff fff 424 | train/epoch_060/ex aaa cca 425 | train/epoch_060/ex h a 426 | train/epoch_060/ex fffff ffbbf 427 | train/epoch_060{1.29s} 428 | train/epoch_061/loss 7.0724 429 | train/epoch_061/ex ff ff 430 | train/epoch_061/ex jjjj ejje 431 | train/epoch_061/ex cccf fffc 432 | train/epoch_061/ex j g 433 | train/epoch_061/ex eee iii 434 | train/epoch_061{1.29s} 435 | train/epoch_062/loss 8.0127 436 | train/epoch_062/ex dddd gddd 437 | train/epoch_062/ex fff ddd 438 | train/epoch_062/ex bbbbb bbbb 439 | train/epoch_062/ex fffff fgggg 440 | train/epoch_062/ex gbd gbg 441 | train/epoch_062{1.31s} 442 | train/epoch_063/loss 7.5818 443 | train/epoch_063/ex eeh eii 444 | train/epoch_063/ex gggg aggg 445 | train/epoch_063/ex eeee eeej 446 | train/epoch_063/ex ggg aaa 447 | train/epoch_063/ex c g 448 | train/epoch_063{1.24s} 449 | train/epoch_064/loss 6.6310 450 | train/epoch_064/ex b b 451 | train/epoch_064/ex bcb bcb 452 | train/epoch_064/ex d b 453 | train/epoch_064/ex bbbb ccbc 454 | train/epoch_064/ex g j 455 | train/epoch_064{1.27s} 456 | train/epoch_065/loss 7.1209 457 | train/epoch_065/ex gg dh 458 | train/epoch_065/ex bbbbb bbjbb 459 | train/epoch_065/ex bbbbb bbfbf 460 | train/epoch_065/ex j j 461 | train/epoch_065/ex jjj jdj 462 | train/epoch_065{1.24s} 463 | train/epoch_066/loss 6.4592 464 | train/epoch_066/ex jf fh 465 | train/epoch_066/ex ii ii 466 | train/epoch_066/ex dc cd 467 | train/epoch_066/ex dd di 468 | train/epoch_066/ex aa ii 469 | train/epoch_066{1.26s} 470 | train/epoch_067/loss 6.4710 471 | train/epoch_067/ex ffff cfff 472 | train/epoch_067/ex eeeeeee eieeeee 473 | train/epoch_067/ex gggggg gggggg 474 | train/epoch_067/ex jf fj 475 | train/epoch_067/ex aa ga 476 | train/epoch_067{1.26s} 477 | train/epoch_068/loss 6.6270 478 | train/epoch_068/ex jjjjj djjjj 479 | train/epoch_068/ex fffff jjdjj 480 | train/epoch_068/ex bbbbb bbbbb 481 | train/epoch_068/ex i c 482 | train/epoch_068/ex bdbd addc 483 | train/epoch_068{1.27s} 484 | train/epoch_069/loss 6.9235 485 | train/epoch_069/ex ddddddd ddddddd 486 | train/epoch_069/ex hahah hahhf 487 | train/epoch_069/ex bbb ddd 488 | train/epoch_069/ex g a 489 | train/epoch_069/ex haaaa aahaj 490 | train/epoch_069{1.26s} 491 | train/epoch_070/loss 6.1613 492 | train/epoch_070/ex eae aee 493 | train/epoch_070/ex jjjje jjddf 494 | train/epoch_070/ex eeeeee eeeeee 495 | train/epoch_070/ex cbb bbc 496 | train/epoch_070/ex fffff ffhff 497 | train/epoch_070{1.29s} 498 | train/epoch_071/loss 6.6061 499 | train/epoch_071/ex ii ii 500 | train/epoch_071/ex iii aii 501 | train/epoch_071/ex eeeeee eeeeee 502 | train/epoch_071/ex eeeeeeee eeeeeeee 503 | train/epoch_071/ex jjjjjjjj jjjjjjjj 504 | train/epoch_071{1.27s} 505 | train/epoch_072/loss 6.2274 506 | train/epoch_072/ex j b 507 | train/epoch_072/ex hhiiiii hhhiiii 508 | train/epoch_072/ex jjjjj ejjjj 509 | train/epoch_072/ex aaj aaj 510 | train/epoch_072/ex jfjfj fjjjf 511 | train/epoch_072{1.26s} 512 | train/epoch_073/loss 6.6819 513 | train/epoch_073/ex b j 514 | train/epoch_073/ex bcbc bicb 515 | train/epoch_073/ex bb bb 516 | train/epoch_073/ex aaaa aaaa 517 | train/epoch_073/ex d h 518 | train/epoch_073{1.24s} 519 | train/epoch_074/loss 5.8375 520 | train/epoch_074/ex j j 521 | train/epoch_074/ex igig ighf 522 | train/epoch_074/ex jjjjjjj jjjjjjj 523 | train/epoch_074/ex hddh hdhh 524 | train/epoch_074/ex eeee eaaa 525 | train/epoch_074{1.30s} 526 | train/epoch_075/loss 6.2506 527 | train/epoch_075/ex effe eeef 528 | train/epoch_075/ex aiii ggig 529 | train/epoch_075/ex b a 530 | train/epoch_075/ex dde eie 531 | train/epoch_075/ex bffffffb bffbbbfb 532 | train/epoch_075{1.29s} 533 | train/epoch_076/loss 6.4191 534 | train/epoch_076/ex eeeee ceeee 535 | train/epoch_076/ex e h 536 | train/epoch_076/ex cccc bccg 537 | train/epoch_076/ex iii iii 538 | train/epoch_076/ex ic db 539 | train/epoch_076{1.29s} 540 | train/epoch_077/loss 6.5926 541 | train/epoch_077/ex eee eef 542 | train/epoch_077/ex jjjjj ejejj 543 | train/epoch_077/ex jjjjjjj jjjjjjj 544 | train/epoch_077/ex ggggg ggggg 545 | train/epoch_077/ex iiia iiaa 546 | train/epoch_077{1.24s} 547 | train/epoch_078/loss 6.2125 548 | train/epoch_078/ex ffffffffj ffjffffff 549 | train/epoch_078/ex bbbbbb bbbbbb 550 | train/epoch_078/ex hh aa 551 | train/epoch_078/ex bb gg 552 | train/epoch_078/ex gggggg gggggg 553 | train/epoch_078{1.27s} 554 | train/epoch_079/loss 6.1175 555 | train/epoch_079/ex bjbj bfbj 556 | train/epoch_079/ex eeeeee eeeeee 557 | train/epoch_079/ex he eg 558 | train/epoch_079/ex ddd dda 559 | train/epoch_079/ex bbbbbb bbbibb 560 | train/epoch_079{1.24s} 561 | train/epoch_080/loss 5.9942 562 | train/epoch_080/ex ggg ggf 563 | train/epoch_080/ex h c 564 | train/epoch_080/ex ibi bfi 565 | train/epoch_080/ex j g 566 | train/epoch_080/ex h e 567 | train/epoch_080{1.25s} 568 | train/epoch_081/loss 6.2856 569 | train/epoch_081/ex ggge heee 570 | train/epoch_081/ex ebib eiib 571 | train/epoch_081/ex eeeeee eeeeee 572 | train/epoch_081/ex eeeeee eeeeec 573 | train/epoch_081/ex bbbbbbb dbbbbbb 574 | train/epoch_081{1.20s} 575 | train/epoch_082/loss 5.8819 576 | train/epoch_082/ex b g 577 | train/epoch_082/ex i j 578 | train/epoch_082/ex eeee ccee 579 | train/epoch_082/ex agaaaa aaggag 580 | train/epoch_082/ex j j 581 | train/epoch_082{1.25s} 582 | train/epoch_083/loss 6.3647 583 | train/epoch_083/ex gggg gggg 584 | train/epoch_083/ex hd bh 585 | train/epoch_083/ex jjjjj jjjjj 586 | train/epoch_083/ex aa gg 587 | train/epoch_083/ex d i 588 | train/epoch_083{1.28s} 589 | train/epoch_084/loss 5.9172 590 | train/epoch_084/ex eeeeee eeeeee 591 | train/epoch_084/ex bbbbb bbcbb 592 | train/epoch_084/ex dbddbdb bdbdbbd 593 | train/epoch_084/ex ccg cgg 594 | train/epoch_084/ex cccc gggc 595 | train/epoch_084{1.28s} 596 | train/epoch_085/loss 5.9106 597 | Epoch 85: reducing learning rate of group 0 to 1.0000e-03. 598 | train/epoch_085/ex jj jj 599 | train/epoch_085/ex hed dhd 600 | train/epoch_085/ex aaa aaa 601 | train/epoch_085/ex b j 602 | train/epoch_085/ex hhhhh hhhhh 603 | train/epoch_085{1.28s} 604 | train/epoch_086/loss 6.0638 605 | train/epoch_086/ex gj gb 606 | train/epoch_086/ex ggggg beggg 607 | train/epoch_086/ex ja ej 608 | train/epoch_086/ex if ij 609 | train/epoch_086/ex aa aj 610 | train/epoch_086{1.29s} 611 | train/epoch_087/loss 5.7187 612 | train/epoch_087/ex cccc cccc 613 | train/epoch_087/ex eee eee 614 | train/epoch_087/ex fff fff 615 | train/epoch_087/ex efefe ifaea 616 | train/epoch_087/ex g f 617 | train/epoch_087{1.26s} 618 | train/epoch_088/loss 5.8355 619 | train/epoch_088/ex jf jg 620 | train/epoch_088/ex jjj jje 621 | train/epoch_088/ex cccce cceee 622 | train/epoch_088/ex iii ggg 623 | train/epoch_088/ex hhhhhhh hhhhahh 624 | train/epoch_088{1.26s} 625 | train/epoch_089/loss 5.9665 626 | train/epoch_089/ex i g 627 | train/epoch_089/ex a d 628 | train/epoch_089/ex a c 629 | train/epoch_089/ex ie ji 630 | train/epoch_089/ex ccc ccc 631 | train/epoch_089{1.24s} 632 | train/epoch_090/loss 5.6940 633 | train/epoch_090/ex iiii iiie 634 | train/epoch_090/ex didddi dididd 635 | train/epoch_090/ex iii iii 636 | train/epoch_090/ex iii iii 637 | train/epoch_090/ex dddddddd hddddddd 638 | train/epoch_090{1.25s} 639 | train/epoch_091/loss 5.3599 640 | train/epoch_091/ex b j 641 | train/epoch_091/ex gggggg gggggg 642 | train/epoch_091/ex ddda bddi 643 | train/epoch_091/ex bbb fff 644 | train/epoch_091/ex aab bba 645 | train/epoch_091{1.29s} 646 | train/epoch_092/loss 5.6582 647 | train/epoch_092/ex bbbbb bbbbb 648 | train/epoch_092/ex g e 649 | train/epoch_092/ex g i 650 | train/epoch_092/ex ccchcch cchchhc 651 | train/epoch_092/ex aag gga 652 | train/epoch_092{1.27s} 653 | train/epoch_093/loss 6.0616 654 | train/epoch_093/ex ddddf dddfd 655 | train/epoch_093/ex icccci iiaiia 656 | train/epoch_093/ex bj bj 657 | train/epoch_093/ex d h 658 | train/epoch_093/ex bbe cce 659 | train/epoch_093{1.28s} 660 | train/epoch_094/loss 5.7914 661 | train/epoch_094/ex ddc bdd 662 | train/epoch_094/ex g a 663 | train/epoch_094/ex iiiiii iiiiii 664 | train/epoch_094/ex cchcch hcccch 665 | train/epoch_094/ex ebe beb 666 | train/epoch_094{1.26s} 667 | train/epoch_095/loss 5.7248 668 | train/epoch_095/ex bbbb bbbb 669 | train/epoch_095/ex c e 670 | train/epoch_095/ex aa hh 671 | train/epoch_095/ex d h 672 | train/epoch_095/ex eeeee eeeee 673 | train/epoch_095{1.24s} 674 | train/epoch_096/loss 5.9161 675 | train/epoch_096/ex ce ig 676 | train/epoch_096/ex iih aii 677 | train/epoch_096/ex ggg ggg 678 | train/epoch_096/ex jejeje jejeej 679 | train/epoch_096/ex jje jij 680 | train/epoch_096{1.26s} 681 | train/epoch_097/loss 5.5123 682 | train/epoch_097/ex di dh 683 | train/epoch_097/ex hj ja 684 | train/epoch_097/ex fffff fffff 685 | train/epoch_097/ex dgd dcb 686 | train/epoch_097/ex ffffffff ffffffff 687 | train/epoch_097{1.27s} 688 | train/epoch_098/loss 5.7965 689 | train/epoch_098/ex hhhhhh hhhhhh 690 | train/epoch_098/ex fff fff 691 | train/epoch_098/ex bf bj 692 | train/epoch_098/ex cccj ccce 693 | train/epoch_098/ex ggggggggj ffgggggjg 694 | train/epoch_098{1.28s} 695 | train/epoch_099/loss 5.7147 696 | train/epoch_099/ex bi gi 697 | train/epoch_099/ex aab aab 698 | train/epoch_099/ex ddhhh hdhhh 699 | train/epoch_099/ex jja jff 700 | train/epoch_099/ex eeee eeee 701 | train/epoch_099{1.29s} 702 | train/epoch_100/loss 5.5634 703 | train/epoch_100/ex hhhg hhhg 704 | train/epoch_100/ex b i 705 | train/epoch_100/ex ccd cjc 706 | train/epoch_100/ex hhhhh hhhhh 707 | train/epoch_100/ex c j 708 | train/epoch_100{1.29s} 709 | train/epoch_101/loss 6.0748 710 | train/epoch_101/ex dcdd dcdd 711 | train/epoch_101/ex ic ci 712 | train/epoch_101/ex dbdbdb bdbdbd 713 | train/epoch_101/ex aagaaa aggggg 714 | train/epoch_101/ex f a 715 | train/epoch_101{1.30s} 716 | train/epoch_102/loss 5.9902 717 | Epoch 102: reducing learning rate of group 0 to 5.0000e-04. 718 | train/epoch_102/ex aaggg ggaai 719 | train/epoch_102/ex ffffa fafff 720 | train/epoch_102/ex bgb gbg 721 | train/epoch_102/ex dh id 722 | train/epoch_102/ex iii iii 723 | train/epoch_102{1.28s} 724 | train/epoch_103/loss 5.7274 725 | train/epoch_103/ex aaf haa 726 | train/epoch_103/ex ccc ccb 727 | train/epoch_103/ex eeeeehhh hhheheee 728 | train/epoch_103/ex jjji jiii 729 | train/epoch_103/ex hh hf 730 | train/epoch_103{1.26s} 731 | train/epoch_104/loss 5.8842 732 | train/epoch_104/ex ggggg ggggg 733 | train/epoch_104/ex ea ea 734 | train/epoch_104/ex g f 735 | train/epoch_104/ex ggg gga 736 | train/epoch_104/ex ddddddddd ddddddddd 737 | train/epoch_104{1.27s} 738 | train/epoch_105/loss 5.4631 739 | train/epoch_105/ex ha ca 740 | train/epoch_105/ex aae faa 741 | train/epoch_105/ex iii fff 742 | train/epoch_105/ex hfh fhi 743 | train/epoch_105/ex iiiiii iiiiii 744 | train/epoch_105{1.26s} 745 | train/epoch_106/loss 5.7931 746 | train/epoch_106/ex aeeaea iaaaie 747 | train/epoch_106/ex bbb bbb 748 | train/epoch_106/ex j b 749 | train/epoch_106/ex d e 750 | train/epoch_106/ex d d 751 | train/epoch_106{1.29s} 752 | train/epoch_107/loss 5.7125 753 | train/epoch_107/ex eeeee eeeee 754 | train/epoch_107/ex aaaaa aaaaa 755 | train/epoch_107/ex aaaaa aaaah 756 | train/epoch_107/ex ede aed 757 | train/epoch_107/ex efgh fhgh 758 | train/epoch_107{1.27s} 759 | train/epoch_108/loss 5.6252 760 | train/epoch_108/ex ad ce 761 | train/epoch_108/ex bba aab 762 | train/epoch_108/ex hhi hhi 763 | train/epoch_108/ex bd gd 764 | train/epoch_108/ex d h 765 | train/epoch_108{1.23s} 766 | train/epoch_109/loss 5.6111 767 | train/epoch_109/ex a c 768 | train/epoch_109/ex aha hag 769 | train/epoch_109/ex i j 770 | train/epoch_109/ex ja ai 771 | train/epoch_109/ex eie eie 772 | train/epoch_109{1.26s} 773 | train/epoch_110/loss 5.9572 774 | train/epoch_110/ex eeeee eeeee 775 | train/epoch_110/ex cjcjcj cjccjc 776 | train/epoch_110/ex iij jji 777 | train/epoch_110/ex fb bf 778 | train/epoch_110/ex fffdd ddddf 779 | train/epoch_110{1.26s} 780 | train/epoch_111/loss 6.0238 781 | train/epoch_111/ex ddd fff 782 | train/epoch_111/ex j b 783 | train/epoch_111/ex bbbbbbb bbbbbbb 784 | train/epoch_111/ex hhhhh hhhhh 785 | train/epoch_111/ex afaa faff 786 | train/epoch_111{1.25s} 787 | train/epoch_112/loss 6.1947 788 | train/epoch_112/ex e e 789 | train/epoch_112/ex eeeeeeh eeeehhh 790 | train/epoch_112/ex ec eg 791 | train/epoch_112/ex ccccj jcccj 792 | train/epoch_112/ex ga ga 793 | train/epoch_112{1.29s} 794 | train/epoch_113/loss 5.6839 795 | Epoch 113: reducing learning rate of group 0 to 2.5000e-04. 796 | train/epoch_113/ex jjj jjj 797 | train/epoch_113/ex fdfd fbfb 798 | train/epoch_113/ex bb bb 799 | train/epoch_113/ex hhh hhh 800 | train/epoch_113/ex d f 801 | train/epoch_113{1.27s} 802 | train/epoch_114/loss 5.2755 803 | train/epoch_114/ex aa aa 804 | train/epoch_114/ex eeg jee 805 | train/epoch_114/ex bbbb bbbb 806 | train/epoch_114/ex ccc ccc 807 | train/epoch_114/ex e e 808 | train/epoch_114{1.28s} 809 | train/epoch_115/loss 5.2350 810 | train/epoch_115/ex jjjjjj jjjjjj 811 | train/epoch_115/ex aaaaga aggaaa 812 | train/epoch_115/ex ggg ggg 813 | train/epoch_115/ex beeeeeeb ebbbbeeb 814 | train/epoch_115/ex iii fff 815 | train/epoch_115{1.27s} 816 | train/epoch_116/loss 5.5642 817 | train/epoch_116/ex dddd dddd 818 | train/epoch_116/ex ig ig 819 | train/epoch_116/ex chchc bhchh 820 | train/epoch_116/ex bbbb bbbb 821 | train/epoch_116/ex gjgg jjgj 822 | train/epoch_116{1.29s} 823 | train/epoch_117/loss 5.8783 824 | train/epoch_117/ex ffff fffi 825 | train/epoch_117/ex gggga ggaaa 826 | train/epoch_117/ex bi ib 827 | train/epoch_117/ex bbb jjj 828 | train/epoch_117/ex bbbbbb bbbbbb 829 | train/epoch_117{1.27s} 830 | train/epoch_118/loss 5.9089 831 | train/epoch_118/ex aah ahh 832 | train/epoch_118/ex jjd jjb 833 | train/epoch_118/ex e h 834 | train/epoch_118/ex hac cha 835 | train/epoch_118/ex bbbbb bbbbb 836 | train/epoch_118{1.26s} 837 | train/epoch_119/loss 5.6352 838 | train/epoch_119/ex aaaaa aaaaa 839 | train/epoch_119/ex cccbcccc cbbccccc 840 | train/epoch_119/ex gag igi 841 | train/epoch_119/ex hhhh hhhh 842 | train/epoch_119/ex g c 843 | train/epoch_119{1.27s} 844 | train/epoch_120/loss 5.2391 845 | train/epoch_120/ex ggd ggh 846 | train/epoch_120/ex jdjd jdjd 847 | train/epoch_120/ex gb ca 848 | train/epoch_120/ex cch cch 849 | train/epoch_120/ex cfc fec 850 | train/epoch_120{1.28s} 851 | train/epoch_121/loss 5.3019 852 | train/epoch_121/ex iii iii 853 | train/epoch_121/ex ee ee 854 | train/epoch_121/ex chch jcch 855 | train/epoch_121/ex i j 856 | train/epoch_121/ex aaac caaa 857 | train/epoch_121{1.28s} 858 | train/epoch_122/loss 5.6026 859 | train/epoch_122/ex hhh jjj 860 | train/epoch_122/ex hhj jhh 861 | train/epoch_122/ex aaaaj aaaaj 862 | train/epoch_122/ex eeeeee eeeeee 863 | train/epoch_122/ex bdbd gbdb 864 | train/epoch_122{1.25s} 865 | train/epoch_123/loss 5.4459 866 | train/epoch_123/ex dggddgg fddgdgg 867 | train/epoch_123/ex ggggggg ggggggg 868 | train/epoch_123/ex gggggggggf ggggfggggd 869 | train/epoch_123/ex ffh ffh 870 | train/epoch_123/ex hhhhh hhhhh 871 | train/epoch_123{1.28s} 872 | train/epoch_124/loss 5.1775 873 | train/epoch_124/ex gghg hhgg 874 | train/epoch_124/ex ghg ghg 875 | train/epoch_124/ex ggg ggg 876 | train/epoch_124/ex fi hi 877 | train/epoch_124/ex cc jj 878 | train/epoch_124{1.28s} 879 | train/epoch_125/loss 5.3209 880 | train/epoch_125/ex hhhhh hhhhh 881 | train/epoch_125/ex iai iha 882 | train/epoch_125/ex jjg gjj 883 | train/epoch_125/ex bbb bbg 884 | train/epoch_125/ex acac caca 885 | train/epoch_125{1.27s} 886 | train/epoch_126/loss 5.6072 887 | train/epoch_126/ex ggggggg ggggggg 888 | train/epoch_126/ex aaaaa aaaaa 889 | train/epoch_126/ex dddb eddd 890 | train/epoch_126/ex eeeeeee eeeeeee 891 | train/epoch_126/ex ijijijij jijjiiij 892 | train/epoch_126{1.29s} 893 | train/epoch_127/loss 5.5849 894 | train/epoch_127/ex hhhd hhhd 895 | train/epoch_127/ex jji bjj 896 | train/epoch_127/ex j i 897 | train/epoch_127/ex aaaa aaaa 898 | train/epoch_127/ex iie iee 899 | train/epoch_127{1.29s} 900 | train/epoch_128/loss 5.7705 901 | train/epoch_128/ex bbe bbe 902 | train/epoch_128/ex d j 903 | train/epoch_128/ex bf eb 904 | train/epoch_128/ex ddddd ddddd 905 | train/epoch_128/ex fffff fffff 906 | train/epoch_128{1.29s} 907 | train/epoch_129/loss 4.9824 908 | train/epoch_129/ex hj jh 909 | train/epoch_129/ex gigig igigi 910 | train/epoch_129/ex aaa aaa 911 | train/epoch_129/ex c a 912 | train/epoch_129/ex e d 913 | train/epoch_129{1.29s} 914 | train/epoch_130/loss 5.5260 915 | train/epoch_130/ex ijibi bibib 916 | train/epoch_130/ex eh be 917 | train/epoch_130/ex d d 918 | train/epoch_130/ex eeeeeee eeeeeee 919 | train/epoch_130/ex iiiijii jjijjii 920 | train/epoch_130{1.24s} 921 | train/epoch_131/loss 5.5508 922 | train/epoch_131/ex hhhhhhhhhhh hhhhhhhhhhh 923 | train/epoch_131/ex gb ga 924 | train/epoch_131/ex e g 925 | train/epoch_131/ex ggd ggd 926 | train/epoch_131/ex ggge ggge 927 | train/epoch_131{1.27s} 928 | train/epoch_132/loss 5.5362 929 | train/epoch_132/ex jj jj 930 | train/epoch_132/ex d i 931 | train/epoch_132/ex iic iid 932 | train/epoch_132/ex ggb gbb 933 | train/epoch_132/ex ebe ebj 934 | train/epoch_132{1.26s} 935 | train/epoch_133/loss 4.9556 936 | train/epoch_133/ex gdggdgd gdggggd 937 | train/epoch_133/ex i i 938 | train/epoch_133/ex bbbbbee ebbbbbb 939 | train/epoch_133/ex ddddddd ddddddd 940 | train/epoch_133/ex jje eea 941 | train/epoch_133{1.29s} 942 | train/epoch_134/loss 5.4120 943 | train/epoch_134/ex aaa aaa 944 | train/epoch_134/ex ibi ibi 945 | train/epoch_134/ex gggggggg gggggggg 946 | train/epoch_134/ex iia aii 947 | train/epoch_134/ex hhhh hhhh 948 | train/epoch_134{1.26s} 949 | train/epoch_135/loss 5.2009 950 | train/epoch_135/ex i i 951 | train/epoch_135/ex ggghgggg gggghhgh 952 | train/epoch_135/ex ggi ggc 953 | train/epoch_135/ex bc cb 954 | train/epoch_135/ex d d 955 | train/epoch_135{1.24s} 956 | train/epoch_136/loss 4.9664 957 | train/epoch_136/ex jjjff eeefj 958 | train/epoch_136/ex jjj jjj 959 | train/epoch_136/ex aaa aaa 960 | train/epoch_136/ex g g 961 | train/epoch_136/ex jjhj jhjj 962 | train/epoch_136{1.27s} 963 | train/epoch_137/loss 5.2092 964 | train/epoch_137/ex dde dee 965 | train/epoch_137/ex hah ich 966 | train/epoch_137/ex h c 967 | train/epoch_137/ex hhha ahhh 968 | train/epoch_137/ex ddd ddd 969 | train/epoch_137{1.31s} 970 | train/epoch_138/loss 5.5136 971 | train/epoch_138/ex aaa aaa 972 | train/epoch_138/ex aaaaaaa aaaaaaa 973 | train/epoch_138/ex c a 974 | train/epoch_138/ex aaa aaa 975 | train/epoch_138/ex c a 976 | train/epoch_138{1.25s} 977 | train/epoch_139/loss 5.5350 978 | train/epoch_139/ex bbjbbj bjbjjj 979 | train/epoch_139/ex i h 980 | train/epoch_139/ex hhfh hhfh 981 | train/epoch_139/ex hhhhh hhhhh 982 | train/epoch_139/ex ffjf ffjf 983 | train/epoch_139{1.28s} 984 | train/epoch_140/loss 5.3522 985 | train/epoch_140/ex g c 986 | train/epoch_140/ex cc gg 987 | train/epoch_140/ex dddb gddd 988 | train/epoch_140/ex h i 989 | train/epoch_140/ex jccccj ccchjc 990 | train/epoch_140{1.29s} 991 | train/epoch_141/loss 5.7261 992 | train/epoch_141/ex ffffi iiiif 993 | train/epoch_141/ex ddddddddd ddddddddd 994 | train/epoch_141/ex ffff ffff 995 | train/epoch_141/ex ffffh ffffh 996 | train/epoch_141/ex eh he 997 | train/epoch_141{1.31s} 998 | train/epoch_142/loss 5.4427 999 | train/epoch_142/ex cf cf 1000 | train/epoch_142/ex g c 1001 | train/epoch_142/ex di hd 1002 | train/epoch_142/ex c c 1003 | train/epoch_142/ex cccc gggh 1004 | train/epoch_142{1.26s} 1005 | train/epoch_143/loss 5.9232 1006 | train/epoch_143/ex ah hi 1007 | train/epoch_143/ex e h 1008 | train/epoch_143/ex bbbbb bbbbb 1009 | train/epoch_143/ex eeeee eeeee 1010 | train/epoch_143/ex a i 1011 | train/epoch_143{1.30s} 1012 | train/epoch_144/loss 5.6765 1013 | Epoch 144: reducing learning rate of group 0 to 1.2500e-04. 1014 | train/epoch_144/ex c e 1015 | train/epoch_144/ex cecece ceecec 1016 | train/epoch_144/ex b i 1017 | train/epoch_144/ex iii iii 1018 | train/epoch_144/ex e d 1019 | train/epoch_144{1.24s} 1020 | train/epoch_145/loss 5.5937 1021 | train/epoch_145/ex hhhd hggg 1022 | train/epoch_145/ex ea ec 1023 | train/epoch_145/ex hj hf 1024 | train/epoch_145/ex aaaa jjjj 1025 | train/epoch_145/ex cccj cccj 1026 | train/epoch_145{1.28s} 1027 | train/epoch_146/loss 5.4225 1028 | train/epoch_146/ex ffe ffe 1029 | train/epoch_146/ex hhhh hhhc 1030 | train/epoch_146/ex aaf jaa 1031 | train/epoch_146/ex iiiiiid aiiiiii 1032 | train/epoch_146/ex jc jb 1033 | train/epoch_146{1.28s} 1034 | train/epoch_147/loss 5.3764 1035 | train/epoch_147/ex b b 1036 | train/epoch_147/ex j h 1037 | train/epoch_147/ex fff fff 1038 | train/epoch_147/ex gg ee 1039 | train/epoch_147/ex c i 1040 | train/epoch_147{1.32s} 1041 | train/epoch_148/loss 5.4966 1042 | train/epoch_148/ex iiaaa iiifa 1043 | train/epoch_148/ex i g 1044 | train/epoch_148/ex b b 1045 | train/epoch_148/ex eieei eiiei 1046 | train/epoch_148/ex e g 1047 | train/epoch_148{1.23s} 1048 | train/epoch_149/loss 5.5123 1049 | train/epoch_149/ex hhd dhh 1050 | train/epoch_149/ex ieeie iecci 1051 | train/epoch_149/ex jg jf 1052 | train/epoch_149/ex ja jb 1053 | train/epoch_149/ex if fh 1054 | train/epoch_149{1.28s} 1055 | train/epoch_150/loss 5.4662 1056 | train/epoch_150/ex fi fi 1057 | train/epoch_150/ex cccjj cjjjj 1058 | train/epoch_150/ex jjj jjj 1059 | train/epoch_150/ex dda dda 1060 | train/epoch_150/ex bbbbb bbbbb 1061 | train/epoch_150{1.24s} 1062 | train/epoch_151/loss 5.2341 1063 | train/epoch_151/ex bbbbbe ebbbbb 1064 | train/epoch_151/ex g f 1065 | train/epoch_151/ex hhh hhh 1066 | train/epoch_151/ex cbbc bbcb 1067 | train/epoch_151/ex cch hcc 1068 | train/epoch_151{1.25s} 1069 | train/epoch_152/loss 5.0248 1070 | train/epoch_152/ex ggi cgg 1071 | train/epoch_152/ex e j 1072 | train/epoch_152/ex ddf ddg 1073 | train/epoch_152/ex ae ha 1074 | train/epoch_152/ex ddddddd ddddddd 1075 | train/epoch_152{1.26s} 1076 | train/epoch_153/loss 4.6959 1077 | train/epoch_153/ex fff fff 1078 | train/epoch_153/ex eg he 1079 | train/epoch_153/ex e g 1080 | train/epoch_153/ex hhhhhh hhhhhh 1081 | train/epoch_153/ex hhhhh hhhhh 1082 | train/epoch_153{1.24s} 1083 | train/epoch_154/loss 5.2163 1084 | train/epoch_154/ex aaaaaaa aaaaaaa 1085 | train/epoch_154/ex d e 1086 | train/epoch_154/ex djd djd 1087 | train/epoch_154/ex ehbbh beehb 1088 | train/epoch_154/ex c d 1089 | train/epoch_154{1.31s} 1090 | train/epoch_155/loss 5.3194 1091 | train/epoch_155/ex bbbbb bbbbb 1092 | train/epoch_155/ex aaaa aaaa 1093 | train/epoch_155/ex jjj jjj 1094 | train/epoch_155/ex eeeee eeeee 1095 | train/epoch_155/ex iiii iiii 1096 | train/epoch_155{1.25s} 1097 | train/epoch_156/loss 5.3465 1098 | train/epoch_156/ex dadad addad 1099 | train/epoch_156/ex e d 1100 | train/epoch_156/ex ddddh gdddd 1101 | train/epoch_156/ex gghgggh gghghhh 1102 | train/epoch_156/ex cccccccc cccccccc 1103 | train/epoch_156{1.27s} 1104 | train/epoch_157/loss 5.4544 1105 | train/epoch_157/ex cecec cecee 1106 | train/epoch_157/ex jjj jjj 1107 | train/epoch_157/ex jj jj 1108 | train/epoch_157/ex fffff fffff 1109 | train/epoch_157/ex gggggg gggggg 1110 | train/epoch_157{1.27s} 1111 | train/epoch_158/loss 5.1598 1112 | train/epoch_158/ex ggggg ggggg 1113 | train/epoch_158/ex ddd ddd 1114 | train/epoch_158/ex ef ej 1115 | train/epoch_158/ex jdjj cjjd 1116 | train/epoch_158/ex iiiii iiiii 1117 | train/epoch_158{1.30s} 1118 | train/epoch_159/loss 5.4419 1119 | train/epoch_159/ex fggf fcff 1120 | train/epoch_159/ex jj jj 1121 | train/epoch_159/ex jj jj 1122 | train/epoch_159/ex iiiif iigii 1123 | train/epoch_159/ex aaa aaa 1124 | train/epoch_159{1.26s} 1125 | train/epoch_160/loss 5.5807 1126 | train/epoch_160/ex gggg gggg 1127 | train/epoch_160/ex aabaaab bababbb 1128 | train/epoch_160/ex ia ai 1129 | train/epoch_160/ex ccdccdd ddcdcdd 1130 | train/epoch_160/ex jjj jjj 1131 | train/epoch_160{1.24s} 1132 | train/epoch_161/loss 5.1813 1133 | train/epoch_161/ex iai iai 1134 | train/epoch_161/ex ddh ddi 1135 | train/epoch_161/ex e f 1136 | train/epoch_161/ex hhh hhh 1137 | train/epoch_161/ex iiiia iiiih 1138 | train/epoch_161{1.25s} 1139 | train/epoch_162/loss 5.3061 1140 | train/epoch_162/ex b g 1141 | train/epoch_162/ex aaaaa aaaaa 1142 | train/epoch_162/ex jjj bbb 1143 | train/epoch_162/ex eed dde 1144 | train/epoch_162/ex eegg ggee 1145 | train/epoch_162{1.29s} 1146 | train/epoch_163/loss 5.3052 1147 | train/epoch_163/ex i j 1148 | train/epoch_163/ex dd dd 1149 | train/epoch_163/ex gggggg gggggg 1150 | train/epoch_163/ex jejej fjeej 1151 | train/epoch_163/ex jjjje jjjje 1152 | train/epoch_163{1.26s} 1153 | train/epoch_164/loss 5.3230 1154 | Epoch 164: reducing learning rate of group 0 to 6.2500e-05. 1155 | train/epoch_164/ex eeeee eeeee 1156 | train/epoch_164/ex hj ih 1157 | train/epoch_164/ex ic bh 1158 | train/epoch_164/ex iic iie 1159 | train/epoch_164/ex i j 1160 | train/epoch_164{1.26s} 1161 | train/epoch_165/loss 5.2181 1162 | train/epoch_165/ex bbbb bbbb 1163 | train/epoch_165/ex gggggg gggggg 1164 | train/epoch_165/ex hhihh aaiih 1165 | train/epoch_165/ex aaaaa aaaaa 1166 | train/epoch_165/ex gggg gggg 1167 | train/epoch_165{1.25s} 1168 | train/epoch_166/loss 5.1452 1169 | train/epoch_166/ex jjajj jjgjj 1170 | train/epoch_166/ex igi gig 1171 | train/epoch_166/ex hhd jhh 1172 | train/epoch_166/ex gggggg gggggg 1173 | train/epoch_166/ex iii iii 1174 | train/epoch_166{1.26s} 1175 | train/epoch_167/loss 4.9266 1176 | train/epoch_167/ex jd jd 1177 | train/epoch_167/ex jjj jjj 1178 | train/epoch_167/ex eeaeeea aaaaeae 1179 | train/epoch_167/ex aa aa 1180 | train/epoch_167/ex aag ggj 1181 | train/epoch_167{1.31s} 1182 | train/epoch_168/loss 5.2572 1183 | train/epoch_168/ex ggjg ggfe 1184 | train/epoch_168/ex bccb dbdd 1185 | train/epoch_168/ex aaaaa aaaaa 1186 | train/epoch_168/ex aaa aaa 1187 | train/epoch_168/ex hh hh 1188 | train/epoch_168{1.31s} 1189 | train/epoch_169/loss 5.2025 1190 | train/epoch_169/ex ddh hdd 1191 | train/epoch_169/ex fff fff 1192 | train/epoch_169/ex ggh igg 1193 | train/epoch_169/ex c i 1194 | train/epoch_169/ex gga gga 1195 | train/epoch_169{1.26s} 1196 | train/epoch_170/loss 5.5033 1197 | train/epoch_170/ex c e 1198 | train/epoch_170/ex eeeae eeeae 1199 | train/epoch_170/ex gdgdg egeeg 1200 | train/epoch_170/ex gggg gggg 1201 | train/epoch_170/ex eje jaj 1202 | train/epoch_170{1.29s} 1203 | train/epoch_171/loss 4.7844 1204 | train/epoch_171/ex beeb beeb 1205 | train/epoch_171/ex hhhhh hhhhh 1206 | train/epoch_171/ex gggggg gggggg 1207 | train/epoch_171/ex g d 1208 | train/epoch_171/ex ch be 1209 | train/epoch_171{1.25s} 1210 | train/epoch_172/loss 5.1988 1211 | train/epoch_172/ex hhih jiih 1212 | train/epoch_172/ex b j 1213 | train/epoch_172/ex jjej ejee 1214 | train/epoch_172/ex eeb gee 1215 | train/epoch_172/ex ffffffff ffffffff 1216 | train/epoch_172{1.28s} 1217 | train/epoch_173/loss 5.0899 1218 | train/epoch_173/ex jjje jjji 1219 | train/epoch_173/ex iic gii 1220 | train/epoch_173/ex diiddiiid iidididdd 1221 | train/epoch_173/ex jjjjj ijjjj 1222 | train/epoch_173/ex hdhhdh hddgdh 1223 | train/epoch_173{1.29s} 1224 | train/epoch_174/loss 5.1988 1225 | train/epoch_174/ex hd ah 1226 | train/epoch_174/ex fff jdd 1227 | train/epoch_174/ex aaaa bbbb 1228 | train/epoch_174/ex ddg ddb 1229 | train/epoch_174/ex eeee eeee 1230 | train/epoch_174{1.27s} 1231 | train/epoch_175/loss 4.8534 1232 | Epoch 175: reducing learning rate of group 0 to 3.1250e-05. 1233 | train/epoch_175/ex eee eee 1234 | train/epoch_175/ex e g 1235 | train/epoch_175/ex ddd ddd 1236 | train/epoch_175/ex ddc ddc 1237 | train/epoch_175/ex cc bb 1238 | train/epoch_175{1.27s} 1239 | train/epoch_176/loss 5.3783 1240 | train/epoch_176/ex dh ch 1241 | train/epoch_176/ex accaa accca 1242 | train/epoch_176/ex be eb 1243 | train/epoch_176/ex fffff fffff 1244 | train/epoch_176/ex aaa aaa 1245 | train/epoch_176{1.26s} 1246 | train/epoch_177/loss 5.3563 1247 | train/epoch_177/ex bbbbb bbbbb 1248 | train/epoch_177/ex cccc cccc 1249 | train/epoch_177/ex bi dj 1250 | train/epoch_177/ex gggg gggi 1251 | train/epoch_177/ex fff fff 1252 | train/epoch_177{1.24s} 1253 | train/epoch_178/loss 5.2602 1254 | train/epoch_178/ex iia aai 1255 | train/epoch_178/ex aaa aaa 1256 | train/epoch_178/ex e b 1257 | train/epoch_178/ex jdj jcj 1258 | train/epoch_178/ex jj jj 1259 | train/epoch_178{1.29s} 1260 | train/epoch_179/loss 5.1049 1261 | train/epoch_179/ex hhch aaca 1262 | train/epoch_179/ex iiii iiii 1263 | train/epoch_179/ex bd db 1264 | train/epoch_179/ex d d 1265 | train/epoch_179/ex fe ge 1266 | train/epoch_179{1.25s} 1267 | train/epoch_180/loss 4.9885 1268 | train/epoch_180/ex hhhhh hhhhh 1269 | train/epoch_180/ex eege ggeg 1270 | train/epoch_180/ex ecec cece 1271 | train/epoch_180/ex hdhhdhhhdd dhhhhdhdhh 1272 | train/epoch_180/ex gggggg gggggg 1273 | train/epoch_180{1.27s} 1274 | train/epoch_181/loss 5.5772 1275 | train/epoch_181/ex bbbbbbb bbbbbbb 1276 | train/epoch_181/ex aafa afaa 1277 | train/epoch_181/ex ddgg ggdd 1278 | train/epoch_181/ex gg gg 1279 | train/epoch_181/ex bc cf 1280 | train/epoch_181{1.26s} 1281 | train/epoch_182/loss 4.9859 1282 | train/epoch_182/ex jaj aja 1283 | train/epoch_182/ex jjf jjf 1284 | train/epoch_182/ex fafafafa cafaafaf 1285 | train/epoch_182/ex aaa aaa 1286 | train/epoch_182/ex jjii jiii 1287 | train/epoch_182{1.31s} 1288 | train/epoch_183/loss 5.1117 1289 | train/epoch_183/ex cc cc 1290 | train/epoch_183/ex iei ije 1291 | train/epoch_183/ex cccc eeee 1292 | train/epoch_183/ex eg ge 1293 | train/epoch_183/ex eec ecc 1294 | train/epoch_183{1.27s} 1295 | train/epoch_184/loss 5.3804 1296 | train/epoch_184/ex ea ae 1297 | train/epoch_184/ex ai ag 1298 | train/epoch_184/ex hh hh 1299 | train/epoch_184/ex ei ei 1300 | train/epoch_184/ex bfb fbg 1301 | train/epoch_184{1.27s} 1302 | train/epoch_185/loss 5.1830 1303 | train/epoch_185/ex icic ieic 1304 | train/epoch_185/ex aaaa aaaa 1305 | train/epoch_185/ex dhd dih 1306 | train/epoch_185/ex aaaaa aaaaa 1307 | train/epoch_185/ex hhdhh dhhdd 1308 | train/epoch_185{1.24s} 1309 | train/epoch_186/loss 5.3116 1310 | Epoch 186: reducing learning rate of group 0 to 1.5625e-05. 1311 | train/epoch_186/ex ccc ccc 1312 | train/epoch_186/ex cbj jcj 1313 | train/epoch_186/ex d d 1314 | train/epoch_186/ex hhj ddj 1315 | train/epoch_186/ex ddh hhc 1316 | train/epoch_186{1.28s} 1317 | train/epoch_187/loss 5.0081 1318 | train/epoch_187/ex daadda ddadda 1319 | train/epoch_187/ex bd bd 1320 | train/epoch_187/ex bc cb 1321 | train/epoch_187/ex ia di 1322 | train/epoch_187/ex didi didi 1323 | train/epoch_187{1.27s} 1324 | train/epoch_188/loss 5.7458 1325 | train/epoch_188/ex fffffffdfff ffffffdffff 1326 | train/epoch_188/ex eeieei ieeiee 1327 | train/epoch_188/ex ggfg ggfg 1328 | train/epoch_188/ex cccccee eeeeeaa 1329 | train/epoch_188/ex aaaaaaaf aaacaaaa 1330 | train/epoch_188{1.30s} 1331 | train/epoch_189/loss 5.5837 1332 | train/epoch_189/ex bbd ddb 1333 | train/epoch_189/ex fff fff 1334 | train/epoch_189/ex cb gb 1335 | train/epoch_189/ex ddiddii ddidddi 1336 | train/epoch_189/ex ga ig 1337 | train/epoch_189{1.27s} 1338 | train/epoch_190/loss 5.5785 1339 | train/epoch_190/ex hhhhhhh hhhhhhh 1340 | train/epoch_190/ex bbb bbb 1341 | train/epoch_190/ex eiei ieie 1342 | train/epoch_190/ex iiiiiiif iiiiiiif 1343 | train/epoch_190/ex hhhhf hhhhi 1344 | train/epoch_190{1.23s} 1345 | train/epoch_191/loss 5.1677 1346 | train/epoch_191/ex ddddh dddjd 1347 | train/epoch_191/ex ddd ddd 1348 | train/epoch_191/ex ibi bdi 1349 | train/epoch_191/ex aae aac 1350 | train/epoch_191/ex g g 1351 | train/epoch_191{1.27s} 1352 | train/epoch_192/loss 5.1850 1353 | train/epoch_192/ex aaaa aaaa 1354 | train/epoch_192/ex ei eh 1355 | train/epoch_192/ex hhhhhh hhhhhh 1356 | train/epoch_192/ex gge agg 1357 | train/epoch_192/ex giigi ggdig 1358 | train/epoch_192{1.27s} 1359 | train/epoch_193/loss 5.2440 1360 | train/epoch_193/ex iii iii 1361 | train/epoch_193/ex hhhhhh hhhhhh 1362 | train/epoch_193/ex d h 1363 | train/epoch_193/ex aaaaaaa aaaaaaa 1364 | train/epoch_193/ex i h 1365 | train/epoch_193{1.23s} 1366 | train/epoch_194/loss 5.6167 1367 | train/epoch_194/ex eb ge 1368 | train/epoch_194/ex d d 1369 | train/epoch_194/ex cccc cccc 1370 | train/epoch_194/ex beeb bffe 1371 | train/epoch_194/ex eejj jjee 1372 | train/epoch_194{1.26s} 1373 | train/epoch_195/loss 5.3146 1374 | train/epoch_195/ex eeege egeee 1375 | train/epoch_195/ex ebeeb ebeeb 1376 | train/epoch_195/ex iigiiig eigggii 1377 | train/epoch_195/ex eeeeee eeeeee 1378 | train/epoch_195/ex hh bb 1379 | train/epoch_195{1.29s} 1380 | train/epoch_196/loss 5.2539 1381 | train/epoch_196/ex gggb bggg 1382 | train/epoch_196/ex ii ii 1383 | train/epoch_196/ex gggg gggg 1384 | train/epoch_196/ex efefef feeffe 1385 | train/epoch_196/ex ddd ddd 1386 | train/epoch_196{1.29s} 1387 | train/epoch_197/loss 5.4117 1388 | Epoch 197: reducing learning rate of group 0 to 7.8125e-06. 1389 | train/epoch_197/ex hhe fhh 1390 | train/epoch_197/ex bbbbbb bbbbbb 1391 | train/epoch_197/ex bbbbb bbbbb 1392 | train/epoch_197/ex ggiig giigg 1393 | train/epoch_197/ex cch cch 1394 | train/epoch_197{1.25s} 1395 | train/epoch_198/loss 5.2192 1396 | train/epoch_198/ex bbbbbb bbbbbb 1397 | train/epoch_198/ex e h 1398 | train/epoch_198/ex ggghg ggghh 1399 | train/epoch_198/ex jjjjjjjj jjjjjjjj 1400 | train/epoch_198/ex b j 1401 | train/epoch_198{1.26s} 1402 | train/epoch_199/loss 5.1540 1403 | train/epoch_199/ex jccj jcce 1404 | train/epoch_199/ex ai ih 1405 | train/epoch_199/ex eeeeeee eeeeeee 1406 | train/epoch_199/ex ccf hcc 1407 | train/epoch_199/ex fffg fggg 1408 | train/epoch_199{1.25s} 1409 | train/epoch_200/loss 5.0232 1410 | train/epoch_200/ex eeeee eeeee 1411 | train/epoch_200/ex gjc gcj 1412 | train/epoch_200/ex ggjgg jjjgj 1413 | train/epoch_200/ex eeeed eeddd 1414 | train/epoch_200/ex hd hd 1415 | train/epoch_200{1.29s} 1416 | train/epoch_201/loss 5.5400 1417 | train/epoch_201/ex aae iaa 1418 | train/epoch_201/ex aia iai 1419 | train/epoch_201/ex h e 1420 | train/epoch_201/ex b i 1421 | train/epoch_201/ex hhhhhhhhhh hhhhhhhhhb 1422 | train/epoch_201{1.26s} 1423 | train/epoch_202/loss 5.1476 1424 | train/epoch_202/ex gf gb 1425 | train/epoch_202/ex jjjjjjjj jjjjjjjj 1426 | train/epoch_202/ex aaa aaa 1427 | train/epoch_202/ex eeejeeee jjjjejje 1428 | train/epoch_202/ex fffff fffff 1429 | train/epoch_202{1.26s} 1430 | train/epoch_203/loss 4.9573 1431 | train/epoch_203/ex hihhihihi hiihhiihi 1432 | train/epoch_203/ex bbbbe cbbbb 1433 | train/epoch_203/ex gbgbgb bggbgd 1434 | train/epoch_203/ex feef eefe 1435 | train/epoch_203/ex cccg ggcc 1436 | train/epoch_203{1.25s} 1437 | train/epoch_204/loss 4.7114 1438 | train/epoch_204/ex cc cc 1439 | train/epoch_204/ex gi gj 1440 | train/epoch_204/ex did idc 1441 | train/epoch_204/ex ddddh gdddd 1442 | train/epoch_204/ex aaf aac 1443 | train/epoch_204{1.30s} 1444 | train/epoch_205/loss 5.4390 1445 | train/epoch_205/ex haaaaaah ahhaaahh 1446 | train/epoch_205/ex bbbbbb bbbbbb 1447 | train/epoch_205/ex cbcb bcbc 1448 | train/epoch_205/ex efe efe 1449 | train/epoch_205/ex cccccccc cccccccc 1450 | train/epoch_205{1.26s} 1451 | train/epoch_206/loss 4.9031 1452 | train/epoch_206/ex d d 1453 | train/epoch_206/ex gggggggg gggggggg 1454 | train/epoch_206/ex ddd ddd 1455 | train/epoch_206/ex i e 1456 | train/epoch_206/ex ffi eff 1457 | train/epoch_206{1.23s} 1458 | train/epoch_207/loss 5.1592 1459 | train/epoch_207/ex hhhhhhh hhhhhhh 1460 | train/epoch_207/ex aaa aaa 1461 | train/epoch_207/ex jjee jjee 1462 | train/epoch_207/ex ggggd jgggg 1463 | train/epoch_207/ex ggg ggg 1464 | train/epoch_207{1.26s} 1465 | train/epoch_208/loss 5.5376 1466 | Epoch 208: reducing learning rate of group 0 to 3.9063e-06. 1467 | train/epoch_208/ex eeeea eeiee 1468 | train/epoch_208/ex gggggg gggggg 1469 | train/epoch_208/ex ffd dff 1470 | train/epoch_208/ex iii iii 1471 | train/epoch_208/ex eeeeee eeeeee 1472 | train/epoch_208{1.26s} 1473 | train/epoch_209/loss 5.0808 1474 | train/epoch_209/ex b f 1475 | train/epoch_209/ex hj bj 1476 | train/epoch_209/ex iei aia 1477 | train/epoch_209/ex g i 1478 | train/epoch_209/ex cc cc 1479 | train/epoch_209{1.28s} 1480 | train/epoch_210/loss 5.3517 1481 | train/epoch_210/ex hhhh hhhh 1482 | train/epoch_210/ex ed de 1483 | train/epoch_210/ex bbb bbb 1484 | train/epoch_210/ex bbb bbb 1485 | train/epoch_210/ex dd cc 1486 | train/epoch_210{1.29s} 1487 | train/epoch_211/loss 5.0591 1488 | train/epoch_211/ex iif gii 1489 | train/epoch_211/ex a a 1490 | train/epoch_211/ex ccc ccc 1491 | train/epoch_211/ex dh da 1492 | train/epoch_211/ex hhhh hhhh 1493 | train/epoch_211{1.22s} 1494 | train/epoch_212/loss 5.2907 1495 | train/epoch_212/ex bb bb 1496 | train/epoch_212/ex dccddc cddccd 1497 | train/epoch_212/ex iig gff 1498 | train/epoch_212/ex aj bg 1499 | train/epoch_212/ex ddj jdd 1500 | train/epoch_212{1.26s} 1501 | train/epoch_213/loss 5.2698 1502 | train/epoch_213/ex iiiiii iiiiii 1503 | train/epoch_213/ex iiii iiii 1504 | train/epoch_213/ex j a 1505 | train/epoch_213/ex cce fcc 1506 | train/epoch_213/ex cc cc 1507 | train/epoch_213{1.24s} 1508 | train/epoch_214/loss 5.0994 1509 | train/epoch_214/ex iaiai iaiai 1510 | train/epoch_214/ex iiiii iiiii 1511 | train/epoch_214/ex aaaa ffff 1512 | train/epoch_214/ex jjjje ejjjj 1513 | train/epoch_214/ex e j 1514 | train/epoch_214{1.34s} 1515 | train/epoch_215/loss 5.4496 1516 | train/epoch_215/ex iie iij 1517 | train/epoch_215/ex gd dh 1518 | train/epoch_215/ex aa aa 1519 | train/epoch_215/ex ccc ccc 1520 | train/epoch_215/ex cc cc 1521 | train/epoch_215{1.29s} 1522 | train/epoch_216/loss 5.3148 1523 | train/epoch_216/ex e e 1524 | train/epoch_216/ex ccccc ccccc 1525 | train/epoch_216/ex bbh abb 1526 | train/epoch_216/ex ii ii 1527 | train/epoch_216/ex fhhf hhfh 1528 | train/epoch_216{1.26s} 1529 | train/epoch_217/loss 5.2914 1530 | train/epoch_217/ex iib iih 1531 | train/epoch_217/ex e c 1532 | train/epoch_217/ex ggh igg 1533 | train/epoch_217/ex i j 1534 | train/epoch_217/ex aai iie 1535 | train/epoch_217{1.27s} 1536 | train/epoch_218/loss 5.2549 1537 | train/epoch_218/ex fc if 1538 | train/epoch_218/ex dccdcd ddccdc 1539 | train/epoch_218/ex g f 1540 | train/epoch_218/ex ccc ccc 1541 | train/epoch_218/ex b b 1542 | train/epoch_218{1.26s} 1543 | train/epoch_219/loss 5.4063 1544 | Epoch 219: reducing learning rate of group 0 to 1.9531e-06. 1545 | train/epoch_219/ex ddd ddd 1546 | train/epoch_219/ex cb bc 1547 | train/epoch_219/ex ccj jcc 1548 | train/epoch_219/ex g i 1549 | train/epoch_219/ex iii iii 1550 | train/epoch_219{1.28s} 1551 | train/epoch_220/loss 5.3781 1552 | train/epoch_220/ex dddde dddde 1553 | train/epoch_220/ex dadad badaa 1554 | train/epoch_220/ex i b 1555 | train/epoch_220/ex bbbbb ccccc 1556 | train/epoch_220/ex cbb bcc 1557 | train/epoch_220{1.25s} 1558 | train/epoch_221/loss 5.0902 1559 | train/epoch_221/ex bccb bccb 1560 | train/epoch_221/ex gg cc 1561 | train/epoch_221/ex gj gb 1562 | train/epoch_221/ex aaa aaa 1563 | train/epoch_221/ex jjgjj gggjg 1564 | train/epoch_221{1.27s} 1565 | train/epoch_222/loss 5.2141 1566 | train/epoch_222/ex ffjjf jjjfc 1567 | train/epoch_222/ex c j 1568 | train/epoch_222/ex ec ec 1569 | train/epoch_222/ex h a 1570 | train/epoch_222/ex hddh dhhd 1571 | train/epoch_222{1.28s} 1572 | train/epoch_223/loss 5.3852 1573 | train/epoch_223/ex j j 1574 | train/epoch_223/ex iiiii iiiig 1575 | train/epoch_223/ex e d 1576 | train/epoch_223/ex ic ec 1577 | train/epoch_223/ex eee eee 1578 | train/epoch_223{1.27s} 1579 | train/epoch_224/loss 5.3861 1580 | train/epoch_224/ex ffd ffc 1581 | train/epoch_224/ex aga cga 1582 | train/epoch_224/ex jjjjjjjj jjjjjjjj 1583 | train/epoch_224/ex haha haha 1584 | train/epoch_224/ex jja bjj 1585 | train/epoch_224{1.27s} 1586 | train/epoch_225/loss 5.2511 1587 | train/epoch_225/ex a a 1588 | train/epoch_225/ex ddddddd ddddddd 1589 | train/epoch_225/ex jji jii 1590 | train/epoch_225/ex ecce cecc 1591 | train/epoch_225/ex g i 1592 | train/epoch_225{1.25s} 1593 | train/epoch_226/loss 5.5886 1594 | train/epoch_226/ex ie ie 1595 | train/epoch_226/ex ijiijij ijijjji 1596 | train/epoch_226/ex hh hh 1597 | train/epoch_226/ex jjjjjjj jjjjjjj 1598 | train/epoch_226/ex b c 1599 | train/epoch_226{1.28s} 1600 | train/epoch_227/loss 5.7044 1601 | train/epoch_227/ex eeaee eeaae 1602 | train/epoch_227/ex c a 1603 | train/epoch_227/ex ae ag 1604 | train/epoch_227/ex e c 1605 | train/epoch_227/ex hhh ccc 1606 | train/epoch_227{1.25s} 1607 | train/epoch_228/loss 5.3983 1608 | train/epoch_228/ex cec cec 1609 | train/epoch_228/ex hhhhh hhhhh 1610 | train/epoch_228/ex hhhf hfff 1611 | train/epoch_228/ex eee eee 1612 | train/epoch_228/ex fffhh ffhhh 1613 | train/epoch_228{1.28s} 1614 | train/epoch_229/loss 5.2070 1615 | train/epoch_229/ex iiid aaii 1616 | train/epoch_229/ex ddf ddb 1617 | train/epoch_229/ex c c 1618 | train/epoch_229/ex je fj 1619 | train/epoch_229/ex bccb ibbe 1620 | train/epoch_229{1.27s} 1621 | train/epoch_230/loss 5.3275 1622 | Epoch 230: reducing learning rate of group 0 to 9.7656e-07. 1623 | train/epoch_230/ex b c 1624 | train/epoch_230/ex aaaaa aaaaa 1625 | train/epoch_230/ex eeeee eeeee 1626 | train/epoch_230/ex g i 1627 | train/epoch_230/ex ii ii 1628 | train/epoch_230{1.30s} 1629 | train/epoch_231/loss 5.1923 1630 | train/epoch_231/ex ggg ggg 1631 | train/epoch_231/ex j b 1632 | train/epoch_231/ex j f 1633 | train/epoch_231/ex jjje jjje 1634 | train/epoch_231/ex eed dde 1635 | train/epoch_231{1.26s} 1636 | train/epoch_232/loss 5.1092 1637 | train/epoch_232/ex jjbbj jjbjj 1638 | train/epoch_232/ex d e 1639 | train/epoch_232/ex eee eee 1640 | train/epoch_232/ex ddii dhii 1641 | train/epoch_232/ex fff fff 1642 | train/epoch_232{1.26s} 1643 | train/epoch_233/loss 5.5429 1644 | train/epoch_233/ex hhhhhh hhhhhh 1645 | train/epoch_233/ex aaaae eaaaa 1646 | train/epoch_233/ex ggb igg 1647 | train/epoch_233/ex cccg hggg 1648 | train/epoch_233/ex iii iii 1649 | train/epoch_233{1.29s} 1650 | train/epoch_234/loss 5.5095 1651 | train/epoch_234/ex dd dd 1652 | train/epoch_234/ex ggg ggg 1653 | train/epoch_234/ex hehheheh hehhhhhe 1654 | train/epoch_234/ex eef aee 1655 | train/epoch_234/ex bbb bbb 1656 | train/epoch_234{1.30s} 1657 | train/epoch_235/loss 5.0791 1658 | train/epoch_235/ex jbbbbj bbbjbj 1659 | train/epoch_235/ex gfgf gaha 1660 | train/epoch_235/ex hhhhhhh hhhhhhh 1661 | train/epoch_235/ex ja ai 1662 | train/epoch_235/ex bbbbbbb bbbbbbb 1663 | train/epoch_235{1.23s} 1664 | train/epoch_236/loss 5.7261 1665 | train/epoch_236/ex gb bh 1666 | train/epoch_236/ex eee eee 1667 | train/epoch_236/ex jd jb 1668 | train/epoch_236/ex jjjjjj jjjjjj 1669 | train/epoch_236/ex cc cc 1670 | train/epoch_236{1.28s} 1671 | train/epoch_237/loss 5.5262 1672 | train/epoch_237/ex gd di 1673 | train/epoch_237/ex ab bg 1674 | train/epoch_237/ex eeej eejj 1675 | train/epoch_237/ex aaaj jaaa 1676 | train/epoch_237/ex cccccccc jjjjjjjj 1677 | train/epoch_237{1.30s} 1678 | train/epoch_238/loss 5.4254 1679 | train/epoch_238/ex dcdcd acdac 1680 | train/epoch_238/ex dddddd dddddd 1681 | train/epoch_238/ex cggc cggc 1682 | train/epoch_238/ex aca cdc 1683 | train/epoch_238/ex fffff fffff 1684 | train/epoch_238{1.25s} 1685 | train/epoch_239/loss 5.4764 1686 | train/epoch_239/ex cccfc chccc 1687 | train/epoch_239/ex bbb bbb 1688 | train/epoch_239/ex d h 1689 | train/epoch_239/ex hbhbh hghbh 1690 | train/epoch_239/ex fada fdaf 1691 | train/epoch_239{1.27s} 1692 | train/epoch_240/loss 5.4601 1693 | train/epoch_240/ex i j 1694 | train/epoch_240/ex d d 1695 | train/epoch_240/ex iiiii iiiii 1696 | train/epoch_240/ex jej cje 1697 | train/epoch_240/ex bbgg eegg 1698 | train/epoch_240{1.30s} 1699 | train/epoch_241/loss 5.5127 1700 | Epoch 241: reducing learning rate of group 0 to 4.8828e-07. 1701 | train/epoch_241/ex aa jj 1702 | train/epoch_241/ex ggg ggg 1703 | train/epoch_241/ex cjh dcj 1704 | train/epoch_241/ex dd cc 1705 | train/epoch_241/ex iih iig 1706 | train/epoch_241{1.25s} 1707 | train/epoch_242/loss 4.8979 1708 | train/epoch_242/ex b j 1709 | train/epoch_242/ex jdj jhj 1710 | train/epoch_242/ex aaa aaa 1711 | train/epoch_242/ex eed jje 1712 | train/epoch_242/ex hhha hhha 1713 | train/epoch_242{1.28s} 1714 | train/epoch_243/loss 5.4021 1715 | train/epoch_243/ex ffffjff fffjfff 1716 | train/epoch_243/ex hhhhf hbhhh 1717 | train/epoch_243/ex jaajja jjjajd 1718 | train/epoch_243/ex jjjjjjj jjjjjjj 1719 | train/epoch_243/ex h h 1720 | train/epoch_243{1.25s} 1721 | train/epoch_244/loss 4.6780 1722 | train/epoch_244/ex gggggg gggggg 1723 | train/epoch_244/ex fd fd 1724 | train/epoch_244/ex ij if 1725 | train/epoch_244/ex jjjjjj jjjjjj 1726 | train/epoch_244/ex bh dh 1727 | train/epoch_244{1.26s} 1728 | train/epoch_245/loss 5.1940 1729 | train/epoch_245/ex bbjbbj bjfejj 1730 | train/epoch_245/ex cg cg 1731 | train/epoch_245/ex fddfd ffdjd 1732 | train/epoch_245/ex hh hh 1733 | train/epoch_245/ex cbc bcb 1734 | train/epoch_245{1.24s} 1735 | train/epoch_246/loss 5.2351 1736 | train/epoch_246/ex ba db 1737 | train/epoch_246/ex fdfdf ddfdf 1738 | train/epoch_246/ex eeeeg eeeeg 1739 | train/epoch_246/ex cg cg 1740 | train/epoch_246/ex beb beb 1741 | train/epoch_246{1.28s} 1742 | train/epoch_247/loss 4.7677 1743 | train/epoch_247/ex jj ee 1744 | train/epoch_247/ex h d 1745 | train/epoch_247/ex e a 1746 | train/epoch_247/ex aaa aaa 1747 | train/epoch_247/ex fccfcf fcifcc 1748 | train/epoch_247{1.29s} 1749 | train/epoch_248/loss 5.1935 1750 | train/epoch_248/ex babbaba bbdadbc 1751 | train/epoch_248/ex ei ef 1752 | train/epoch_248/ex jajaj jajja 1753 | train/epoch_248/ex fc ef 1754 | train/epoch_248/ex ggbg dfgg 1755 | train/epoch_248{1.26s} 1756 | train/epoch_249/loss 5.5594 1757 | train/epoch_249/ex dddddd dddddd 1758 | train/epoch_249/ex aaif afaa 1759 | train/epoch_249/ex ddd ddd 1760 | train/epoch_249/ex gga gga 1761 | train/epoch_249/ex g i 1762 | train/epoch_249{1.26s} 1763 | train/epoch_250/loss 5.5036 1764 | train/epoch_250/ex e e 1765 | train/epoch_250/ex gggg gggg 1766 | train/epoch_250/ex ac af 1767 | train/epoch_250/ex i f 1768 | train/epoch_250/ex eefe aeff 1769 | train/epoch_250{1.28s} 1770 | train/epoch_251/loss 5.1481 1771 | train/epoch_251/ex ffffff ffffff 1772 | train/epoch_251/ex ggggag ggggcg 1773 | train/epoch_251/ex gfg fgf 1774 | train/epoch_251/ex gg gg 1775 | train/epoch_251/ex iiiii iiiii 1776 | train/epoch_251{1.28s} 1777 | train/epoch_252/loss 5.4657 1778 | train/epoch_252/ex bbbbbb bbbbbb 1779 | train/epoch_252/ex hhh hhh 1780 | train/epoch_252/ex b f 1781 | train/epoch_252/ex aaff fffb 1782 | train/epoch_252/ex i f 1783 | train/epoch_252{1.27s} 1784 | train/epoch_253/loss 5.6542 1785 | train/epoch_253/ex j b 1786 | train/epoch_253/ex jjj jjj 1787 | train/epoch_253/ex eeb jjg 1788 | train/epoch_253/ex iiiiiii iiiiiii 1789 | train/epoch_253/ex ba bc 1790 | train/epoch_253{1.25s} 1791 | train/epoch_254/loss 5.5091 1792 | train/epoch_254/ex bbbbe ebbbb 1793 | train/epoch_254/ex icciicc cicciic 1794 | train/epoch_254/ex jjj jjj 1795 | train/epoch_254/ex jjcjjjjjj cjjjjjjcc 1796 | train/epoch_254/ex ab ab 1797 | train/epoch_254{1.24s} 1798 | train/epoch_255/loss 5.3215 1799 | Epoch 255: reducing learning rate of group 0 to 2.4414e-07. 1800 | train/epoch_255/ex ej dj 1801 | train/epoch_255/ex ccdcccdcdc dccdddccdc 1802 | train/epoch_255/ex hhhhh hhhhh 1803 | train/epoch_255/ex ia gb 1804 | train/epoch_255/ex e i 1805 | train/epoch_255{1.28s} 1806 | train/epoch_256/loss 5.2321 1807 | train/epoch_256/ex dddddh dddddh 1808 | train/epoch_256/ex eeaee aaeaa 1809 | train/epoch_256/ex g g 1810 | train/epoch_256/ex cc cc 1811 | train/epoch_256/ex cbbbbb bcccbb 1812 | train/epoch_256{1.29s} 1813 | train/epoch_257/loss 5.3356 1814 | train/epoch_257/ex ih ih 1815 | train/epoch_257/ex ce cb 1816 | train/epoch_257/ex d h 1817 | train/epoch_257/ex hhhh hhhh 1818 | train/epoch_257/ex ffjj fffj 1819 | train/epoch_257{1.26s} 1820 | train/epoch_258/loss 4.7755 1821 | train/epoch_258/ex cc bb 1822 | train/epoch_258/ex ddddedd ddddedd 1823 | train/epoch_258/ex e h 1824 | train/epoch_258/ex gggggg gggggg 1825 | train/epoch_258/ex e d 1826 | train/epoch_258{1.28s} 1827 | train/epoch_259/loss 5.1965 1828 | train/epoch_259/ex bbbbbba bbbbabb 1829 | train/epoch_259/ex gd db 1830 | train/epoch_259/ex bbbb bbbb 1831 | train/epoch_259/ex aaa aaa 1832 | train/epoch_259/ex ccccc cccch 1833 | train/epoch_259{1.25s} 1834 | train/epoch_260/loss 5.4111 1835 | train/epoch_260/ex iiib iiif 1836 | train/epoch_260/ex bb bb 1837 | train/epoch_260/ex hhh fff 1838 | train/epoch_260/ex cc cc 1839 | train/epoch_260/ex eaeeaea egaeeea 1840 | train/epoch_260{1.33s} 1841 | train/epoch_261/loss 5.2273 1842 | train/epoch_261/ex iiiiiii iiiiiii 1843 | train/epoch_261/ex beebbeb ebeebee 1844 | train/epoch_261/ex jjh jjh 1845 | train/epoch_261/ex jjjh jjjh 1846 | train/epoch_261/ex iii iii 1847 | train/epoch_261{1.26s} 1848 | train/epoch_262/loss 5.3265 1849 | train/epoch_262/ex a d 1850 | train/epoch_262/ex aac cce 1851 | train/epoch_262/ex eaeae beiei 1852 | train/epoch_262/ex bfffffbf fbfbbbff 1853 | train/epoch_262/ex jcj bcb 1854 | train/epoch_262{1.25s} 1855 | train/epoch_263/loss 5.5598 1856 | train/epoch_263/ex bbbbbb bbbbbb 1857 | train/epoch_263/ex b g 1858 | train/epoch_263/ex ffiii ffiff 1859 | train/epoch_263/ex hhh hhh 1860 | train/epoch_263/ex ffffffff ffffffff 1861 | train/epoch_263{1.29s} 1862 | train/epoch_264/loss 5.4356 1863 | train/epoch_264/ex ie ei 1864 | train/epoch_264/ex a c 1865 | train/epoch_264/ex hhha hhii 1866 | train/epoch_264/ex jjjjjjj jjjjjjj 1867 | train/epoch_264/ex bdi bdi 1868 | train/epoch_264{1.26s} 1869 | train/epoch_265/loss 5.2521 1870 | train/epoch_265/ex ggggjgggcg fcggcfgccc 1871 | train/epoch_265/ex fffif bffbb 1872 | train/epoch_265/ex e f 1873 | train/epoch_265/ex d d 1874 | train/epoch_265/ex ebeb egec 1875 | train/epoch_265{1.31s} 1876 | train/epoch_266/loss 5.0254 1877 | Epoch 266: reducing learning rate of group 0 to 1.2207e-07. 1878 | train/epoch_266/ex iiiii iiiii 1879 | train/epoch_266/ex cjc cji 1880 | train/epoch_266/ex ddd ddd 1881 | train/epoch_266/ex dggdddd ggdgggd 1882 | train/epoch_266/ex giigii igiiig 1883 | train/epoch_266{1.27s} 1884 | train/epoch_267/loss 5.1152 1885 | train/epoch_267/ex bbbbb bbbbb 1886 | train/epoch_267/ex b e 1887 | train/epoch_267/ex iiiiiih iiiiiih 1888 | train/epoch_267/ex cccf cfff 1889 | train/epoch_267/ex ccgg ccgg 1890 | train/epoch_267{1.28s} 1891 | train/epoch_268/loss 4.9526 1892 | train/epoch_268/ex gg cc 1893 | train/epoch_268/ex ec eg 1894 | train/epoch_268/ex dg dg 1895 | train/epoch_268/ex fff fff 1896 | train/epoch_268/ex fafa afaf 1897 | train/epoch_268{1.27s} 1898 | train/epoch_269/loss 5.3438 1899 | train/epoch_269/ex d h 1900 | train/epoch_269/ex bbbbbbbb bbbbbbbb 1901 | train/epoch_269/ex gj fj 1902 | train/epoch_269/ex adada aiiad 1903 | train/epoch_269/ex bi gb 1904 | train/epoch_269{1.28s} 1905 | train/epoch_270/loss 4.9941 1906 | train/epoch_270/ex ihi iaf 1907 | train/epoch_270/ex fcfc fcfa 1908 | train/epoch_270/ex ggg ggg 1909 | train/epoch_270/ex d a 1910 | train/epoch_270/ex jjjdjjd jjdjjjd 1911 | train/epoch_270{1.28s} 1912 | train/epoch_271/loss 5.0858 1913 | train/epoch_271/ex jjjjjjjj fjjjjjjj 1914 | train/epoch_271/ex ccaac aacff 1915 | train/epoch_271/ex fffffd ffbbff 1916 | train/epoch_271/ex aaa aaa 1917 | train/epoch_271/ex hhjjhhj jjhhhjg 1918 | train/epoch_271{1.27s} 1919 | train/epoch_272/loss 5.0796 1920 | train/epoch_272/ex je bj 1921 | train/epoch_272/ex gd df 1922 | train/epoch_272/ex bbbbb bbbbb 1923 | train/epoch_272/ex bbb bbb 1924 | train/epoch_272/ex hhj hhj 1925 | train/epoch_272{1.28s} 1926 | train/epoch_273/loss 5.1146 1927 | train/epoch_273/ex fd cd 1928 | train/epoch_273/ex bbe bbf 1929 | train/epoch_273/ex j a 1930 | train/epoch_273/ex eeeeei eeeeie 1931 | train/epoch_273/ex eeeeh heeee 1932 | train/epoch_273{1.25s} 1933 | train/epoch_274/loss 5.0802 1934 | train/epoch_274/ex aaaaa aaaaa 1935 | train/epoch_274/ex jjjjj jjjjj 1936 | train/epoch_274/ex ggg ggg 1937 | train/epoch_274/ex ddddddd ddddddd 1938 | train/epoch_274/ex bbba bbbd 1939 | train/epoch_274{1.25s} 1940 | train/epoch_275/loss 5.5460 1941 | train/epoch_275/ex eeeeeee eeeeeee 1942 | train/epoch_275/ex d a 1943 | train/epoch_275/ex hhh hhh 1944 | train/epoch_275/ex jjjji jjjii 1945 | train/epoch_275/ex gc cj 1946 | train/epoch_275{1.28s} 1947 | train/epoch_276/loss 5.2379 1948 | train/epoch_276/ex h e 1949 | train/epoch_276/ex eeejee ejeeee 1950 | train/epoch_276/ex eae ead 1951 | train/epoch_276/ex iiiiii iiiiii 1952 | train/epoch_276/ex eegg ggge 1953 | train/epoch_276{1.29s} 1954 | train/epoch_277/loss 5.6893 1955 | Epoch 277: reducing learning rate of group 0 to 6.1035e-08. 1956 | train/epoch_277/ex aaa jjj 1957 | train/epoch_277/ex fh ef 1958 | train/epoch_277/ex aaccaaa aacaaaa 1959 | train/epoch_277/ex iiiiiih iiihiii 1960 | train/epoch_277/ex bbbh bbbi 1961 | train/epoch_277{1.27s} 1962 | train/epoch_278/loss 5.3276 1963 | train/epoch_278/ex dde dde 1964 | train/epoch_278/ex ddddd ddddj 1965 | train/epoch_278/ex ggggcggg ggcggggg 1966 | train/epoch_278/ex jj jj 1967 | train/epoch_278/ex bbbbbb bbbbbb 1968 | train/epoch_278{1.25s} 1969 | train/epoch_279/loss 5.2399 1970 | train/epoch_279/ex hddh hddh 1971 | train/epoch_279/ex d e 1972 | train/epoch_279/ex fa bf 1973 | train/epoch_279/ex jg jg 1974 | train/epoch_279/ex aaaaa aaaaa 1975 | train/epoch_279{1.26s} 1976 | train/epoch_280/loss 5.1643 1977 | train/epoch_280/ex g j 1978 | train/epoch_280/ex h h 1979 | train/epoch_280/ex ig gi 1980 | train/epoch_280/ex hh hh 1981 | train/epoch_280/ex aaaaaaa aaaaaaa 1982 | train/epoch_280{1.25s} 1983 | train/epoch_281/loss 5.1157 1984 | train/epoch_281/ex djd dje 1985 | train/epoch_281/ex beeb feeb 1986 | train/epoch_281/ex ffe hff 1987 | train/epoch_281/ex bbbbb bbbbb 1988 | train/epoch_281/ex eeeeaeee eeeeefee 1989 | train/epoch_281{1.25s} 1990 | train/epoch_282/loss 5.2856 1991 | train/epoch_282/ex bbbc ebbb 1992 | train/epoch_282/ex iih iih 1993 | train/epoch_282/ex jccjj cjjcc 1994 | train/epoch_282/ex hh ee 1995 | train/epoch_282/ex de ed 1996 | train/epoch_282{1.25s} 1997 | train/epoch_283/loss 5.3017 1998 | train/epoch_283/ex aaa aaa 1999 | train/epoch_283/ex eeeee eeeee 2000 | train/epoch_283/ex eec cce 2001 | train/epoch_283/ex ddd ddd 2002 | train/epoch_283/ex jfjfj cfcfc 2003 | train/epoch_283{1.27s} 2004 | train/epoch_284/loss 5.6017 2005 | train/epoch_284/ex je gj 2006 | train/epoch_284/ex ddii diii 2007 | train/epoch_284/ex jjjjj jjjjd 2008 | train/epoch_284/ex eeehe eeiee 2009 | train/epoch_284/ex bbf bff 2010 | train/epoch_284{1.27s} 2011 | train/epoch_285/loss 5.3544 2012 | train/epoch_285/ex ddd ddd 2013 | train/epoch_285/ex hh hh 2014 | train/epoch_285/ex jjjfff jdffff 2015 | train/epoch_285/ex d d 2016 | train/epoch_285/ex ggg fff 2017 | train/epoch_285{1.24s} 2018 | train/epoch_286/loss 5.6557 2019 | train/epoch_286/ex d h 2020 | train/epoch_286/ex eee eee 2021 | train/epoch_286/ex fff fff 2022 | train/epoch_286/ex eeg gge 2023 | train/epoch_286/ex jjfjj fjjjf 2024 | train/epoch_286{1.26s} 2025 | train/epoch_287/loss 4.8377 2026 | train/epoch_287/ex fdfdf dfdfd 2027 | train/epoch_287/ex ie ie 2028 | train/epoch_287/ex i i 2029 | train/epoch_287/ex hj gh 2030 | train/epoch_287/ex iiii iiii 2031 | train/epoch_287{1.28s} 2032 | train/epoch_288/loss 5.2522 2033 | Epoch 288: reducing learning rate of group 0 to 3.0518e-08. 2034 | train/epoch_288/ex dddddd jjjjjj 2035 | train/epoch_288/ex ffff ffff 2036 | train/epoch_288/ex jajaj jjajb 2037 | train/epoch_288/ex i j 2038 | train/epoch_288/ex cccc cccc 2039 | train/epoch_288{1.28s} 2040 | train/epoch_289/loss 5.6880 2041 | train/epoch_289/ex bbbc bbbf 2042 | train/epoch_289/ex ib ih 2043 | train/epoch_289/ex fffff fffff 2044 | train/epoch_289/ex he eh 2045 | train/epoch_289/ex gf fh 2046 | train/epoch_289{1.28s} 2047 | train/epoch_290/loss 5.2706 2048 | train/epoch_290/ex e d 2049 | train/epoch_290/ex hhhg gggh 2050 | train/epoch_290/ex igigi ficii 2051 | train/epoch_290/ex bbb bbb 2052 | train/epoch_290/ex d d 2053 | train/epoch_290{1.27s} 2054 | train/epoch_291/loss 4.8553 2055 | train/epoch_291/ex jjjjj jjjjj 2056 | train/epoch_291/ex ddbb ddbb 2057 | train/epoch_291/ex aaa ddd 2058 | train/epoch_291/ex aaa aaj 2059 | train/epoch_291/ex hhh hhh 2060 | train/epoch_291{1.24s} 2061 | train/epoch_292/loss 4.8169 2062 | train/epoch_292/ex ddd ddd 2063 | train/epoch_292/ex ggggfg ggggfg 2064 | train/epoch_292/ex e e 2065 | train/epoch_292/ex jj jj 2066 | train/epoch_292/ex dh dh 2067 | train/epoch_292{1.26s} 2068 | train/epoch_293/loss 5.4846 2069 | train/epoch_293/ex bbbbib ibiiii 2070 | train/epoch_293/ex cchc cfcc 2071 | train/epoch_293/ex ddd hhh 2072 | train/epoch_293/ex ecce eeae 2073 | train/epoch_293/ex hhhh hhhh 2074 | train/epoch_293{1.29s} 2075 | train/epoch_294/loss 5.0858 2076 | train/epoch_294/ex d d 2077 | train/epoch_294/ex iai idi 2078 | train/epoch_294/ex aaaab acaaa 2079 | train/epoch_294/ex e e 2080 | train/epoch_294/ex eee eee 2081 | train/epoch_294{1.26s} 2082 | train/epoch_295/loss 5.4773 2083 | train/epoch_295/ex ccccc ccccc 2084 | train/epoch_295/ex e e 2085 | train/epoch_295/ex fif fif 2086 | train/epoch_295/ex gd dg 2087 | train/epoch_295/ex gh gh 2088 | train/epoch_295{1.26s} 2089 | train/epoch_296/loss 5.1608 2090 | train/epoch_296/ex j b 2091 | train/epoch_296/ex eeeeee eeeeee 2092 | train/epoch_296/ex ccj cch 2093 | train/epoch_296/ex ggg ggg 2094 | train/epoch_296/ex gggggg gggggg 2095 | train/epoch_296{1.27s} 2096 | train/epoch_297/loss 4.9794 2097 | train/epoch_297/ex da cd 2098 | train/epoch_297/ex jje jjb 2099 | train/epoch_297/ex hhhj hhhe 2100 | train/epoch_297/ex ggggj jjjjg 2101 | train/epoch_297/ex dde dde 2102 | train/epoch_297{1.27s} 2103 | train/epoch_298/loss 5.6060 2104 | train/epoch_298/ex iig eii 2105 | train/epoch_298/ex ff ff 2106 | train/epoch_298/ex ccc ccc 2107 | train/epoch_298/ex g g 2108 | train/epoch_298/ex hdhdhd ihhida 2109 | train/epoch_298{1.27s} 2110 | train/epoch_299/loss 5.2526 2111 | Epoch 299: reducing learning rate of group 0 to 1.5259e-08. 2112 | train/epoch_299/ex ff ff 2113 | train/epoch_299/ex eeg gaa 2114 | train/epoch_299/ex aaa aaa 2115 | train/epoch_299/ex g f 2116 | train/epoch_299/ex aaa ccc 2117 | train/epoch_299{1.27s} 2118 | train/epoch_300/loss 4.9922 2119 | train/epoch_300/ex hhj hjh 2120 | train/epoch_300/ex ccgcc cgccc 2121 | train/epoch_300/ex c c 2122 | train/epoch_300/ex ffg gff 2123 | train/epoch_300/ex eeee eeee 2124 | train/epoch_300{1.30s} 2125 | train/epoch_301/loss 5.2836 2126 | train/epoch_301/ex gh hg 2127 | train/epoch_301/ex ffcf ffcf 2128 | train/epoch_301/ex di ad 2129 | train/epoch_301/ex a i 2130 | train/epoch_301/ex fgfgf hfggf 2131 | train/epoch_301{1.27s} 2132 | train/epoch_302/loss 5.3875 2133 | train/epoch_302/ex b j 2134 | train/epoch_302/ex ei ed 2135 | train/epoch_302/ex jjbbj bjjbb 2136 | train/epoch_302/ex c c 2137 | train/epoch_302/ex iii iii 2138 | train/epoch_302{1.27s} 2139 | train/epoch_303/loss 5.4097 2140 | train/epoch_303/ex eed edd 2141 | train/epoch_303/ex j i 2142 | train/epoch_303/ex ddd ddd 2143 | train/epoch_303/ex ba ba 2144 | train/epoch_303/ex jjjja cjjjj 2145 | train/epoch_303{1.27s} 2146 | train/epoch_304/loss 5.7080 2147 | train/epoch_304/ex bbb bbb 2148 | train/epoch_304/ex e e 2149 | train/epoch_304/ex faaf chhf 2150 | train/epoch_304/ex eeeeee eeeeee 2151 | train/epoch_304/ex gd ge 2152 | train/epoch_304{1.30s} 2153 | train/epoch_305/loss 5.5396 2154 | train/epoch_305/ex jjjjjj jjjjjj 2155 | train/epoch_305/ex jjjj jjjj 2156 | train/epoch_305/ex bbbbbbb bbbbbbb 2157 | train/epoch_305/ex j g 2158 | train/epoch_305/ex eec ecc 2159 | train/epoch_305{1.31s} 2160 | train/epoch_306/loss 5.3308 2161 | train/epoch_306/ex jjjee jjeee 2162 | train/epoch_306/ex jjc jjc 2163 | train/epoch_306/ex a j 2164 | train/epoch_306/ex gab gbg 2165 | train/epoch_306/ex i g 2166 | train/epoch_306{1.27s} 2167 | train/epoch_307/loss 5.3554 2168 | train/epoch_307/ex b c 2169 | train/epoch_307/ex aaai iibb 2170 | train/epoch_307/ex iii iii 2171 | train/epoch_307/ex ffffff ffffff 2172 | train/epoch_307/ex aaaaaaa aaaaaaa 2173 | train/epoch_307{1.23s} 2174 | train/epoch_308/loss 5.0846 2175 | train/epoch_308/ex dcddc ccdcd 2176 | train/epoch_308/ex iii iii 2177 | train/epoch_308/ex he ah 2178 | train/epoch_308/ex ggjg jccj 2179 | train/epoch_308/ex aaee aaae 2180 | train/epoch_308{1.24s} 2181 | train/epoch_309/loss 5.5337 2182 | train/epoch_309/ex ffh ffh 2183 | train/epoch_309/ex bjbj jbjb 2184 | train/epoch_309/ex ed ef 2185 | train/epoch_309/ex hhjh hjhh 2186 | train/epoch_309/ex i f 2187 | train/epoch_309{1.28s} 2188 | train/epoch_310/loss 5.5638 2189 | train/epoch_310/ex f g 2190 | train/epoch_310/ex cgc jcg 2191 | train/epoch_310/ex gggggg gggggg 2192 | train/epoch_310/ex bd if 2193 | train/epoch_310/ex dddd dddd 2194 | train/epoch_310{1.32s} 2195 | train/epoch_311/loss 5.2004 2196 | train/epoch_311/ex ijijij ijajaj 2197 | train/epoch_311/ex cc cc 2198 | train/epoch_311/ex e d 2199 | train/epoch_311/ex hhhh hhhc 2200 | train/epoch_311/ex iia aai 2201 | train/epoch_311{1.27s} 2202 | train/epoch_312/loss 4.8153 2203 | train/epoch_312/ex fffffff fffffff 2204 | train/epoch_312/ex iifc icff 2205 | train/epoch_312/ex d a 2206 | train/epoch_312/ex eh he 2207 | train/epoch_312/ex ghhhhhh ggghhgh 2208 | train/epoch_312{1.29s} 2209 | train/epoch_313/loss 4.8723 2210 | train/epoch_313/ex eee eee 2211 | train/epoch_313/ex aaaa gaaa 2212 | train/epoch_313/ex bbdbbd dddbdb 2213 | train/epoch_313/ex e h 2214 | train/epoch_313/ex cecce eccie 2215 | train/epoch_313{1.27s} 2216 | train/epoch_314/loss 5.5505 2217 | train/epoch_314/ex cccjj ccccj 2218 | train/epoch_314/ex jdjjjdjdj jajbbdadd 2219 | train/epoch_314/ex ffj ffj 2220 | train/epoch_314/ex b j 2221 | train/epoch_314/ex aab jaa 2222 | train/epoch_314{1.29s} 2223 | train/epoch_315/loss 5.3223 2224 | train/epoch_315/ex jjjjj djjjj 2225 | train/epoch_315/ex ggggggi gggeggg 2226 | train/epoch_315/ex fffff fffff 2227 | train/epoch_315/ex i a 2228 | train/epoch_315/ex eef bee 2229 | train/epoch_315{1.25s} 2230 | train/epoch_316/loss 5.2569 2231 | train/epoch_316/ex gegge dgddg 2232 | train/epoch_316/ex ffffff ffffff 2233 | train/epoch_316/ex bhbhb bhaba 2234 | train/epoch_316/ex ffffffff ffffffff 2235 | train/epoch_316/ex ah hg 2236 | train/epoch_316{1.25s} 2237 | train/epoch_317/loss 5.5604 2238 | train/epoch_317/ex ffeffffffe aefefeeeee 2239 | train/epoch_317/ex ah ch 2240 | train/epoch_317/ex eeeee eeeee 2241 | train/epoch_317/ex ff ff 2242 | train/epoch_317/ex jjjjjjj jjjjjjj 2243 | train/epoch_317{1.29s} 2244 | train/epoch_318/loss 5.1217 2245 | train/epoch_318/ex e b 2246 | train/epoch_318/ex hch hfh 2247 | train/epoch_318/ex hhhhd ghhhh 2248 | train/epoch_318/ex id di 2249 | train/epoch_318/ex iiiiiig giiiiii 2250 | train/epoch_318{1.29s} 2251 | train/epoch_319/loss 5.1010 2252 | train/epoch_319/ex i j 2253 | train/epoch_319/ex eeg cee 2254 | train/epoch_319/ex hhh hhh 2255 | train/epoch_319/ex eeeeeeee eeeeeeee 2256 | train/epoch_319/ex aja ajh 2257 | train/epoch_319{1.27s} 2258 | train/epoch_320/loss 5.6982 2259 | train/epoch_320/ex gg gg 2260 | train/epoch_320/ex hhhhh hhhhh 2261 | train/epoch_320/ex eeiii eeeii 2262 | train/epoch_320/ex b i 2263 | train/epoch_320/ex eeej deee 2264 | train/epoch_320{1.25s} 2265 | train/epoch_321/loss 5.3738 2266 | train/epoch_321/ex eeeeee eeeeee 2267 | train/epoch_321/ex jjjj jjje 2268 | train/epoch_321/ex fffj jfff 2269 | train/epoch_321/ex ee cc 2270 | train/epoch_321/ex jjji jiii 2271 | train/epoch_321{1.29s} 2272 | train/epoch_322/loss 5.6449 2273 | train/epoch_322/ex bbc jbb 2274 | train/epoch_322/ex bibi adbi 2275 | train/epoch_322/ex aaa aaa 2276 | train/epoch_322/ex gggggg gggggg 2277 | train/epoch_322/ex iiiii iiiii 2278 | train/epoch_322{1.30s} 2279 | train/epoch_323/loss 5.3113 2280 | train/epoch_323/ex h i 2281 | train/epoch_323/ex d a 2282 | train/epoch_323/ex jjj jjj 2283 | train/epoch_323/ex eeaeeeea eeaeaaee 2284 | train/epoch_323/ex ffb bff 2285 | train/epoch_323{1.28s} 2286 | train/epoch_324/loss 4.9354 2287 | train/epoch_324/ex fff fff 2288 | train/epoch_324/ex c b 2289 | train/epoch_324/ex dde gdd 2290 | train/epoch_324/ex ifi ifh 2291 | train/epoch_324/ex iiiiii iiiiii 2292 | train/epoch_324{1.25s} 2293 | train/epoch_325/loss 5.6181 2294 | train/epoch_325/ex ii ii 2295 | train/epoch_325/ex iic cii 2296 | train/epoch_325/ex bibbibi biiibib 2297 | train/epoch_325/ex bbe cbb 2298 | train/epoch_325/ex dddd dddd 2299 | train/epoch_325{1.29s} 2300 | train/epoch_326/loss 5.5414 2301 | train/epoch_326/ex eeei eeef 2302 | train/epoch_326/ex e g 2303 | train/epoch_326/ex e j 2304 | train/epoch_326/ex hhh hhh 2305 | train/epoch_326/ex e i 2306 | train/epoch_326{1.28s} 2307 | train/epoch_327/loss 5.1233 2308 | train/epoch_327/ex d h 2309 | train/epoch_327/ex ie bi 2310 | train/epoch_327/ex ca ca 2311 | train/epoch_327/ex ddddj dddda 2312 | train/epoch_327/ex jjjeee jejjjj 2313 | train/epoch_327{1.27s} 2314 | train/epoch_328/loss 5.4084 2315 | train/epoch_328/ex fff fff 2316 | train/epoch_328/ex ggggg ggggg 2317 | train/epoch_328/ex b j 2318 | train/epoch_328/ex hhhh hhhh 2319 | train/epoch_328/ex i i 2320 | train/epoch_328{1.30s} 2321 | train/epoch_329/loss 5.1402 2322 | train/epoch_329/ex jjjcj jjfjj 2323 | train/epoch_329/ex dd dd 2324 | train/epoch_329/ex eeg iee 2325 | train/epoch_329/ex i f 2326 | train/epoch_329/ex gdg gdb 2327 | train/epoch_329{1.27s} 2328 | train/epoch_330/loss 4.9824 2329 | train/epoch_330/ex cec cei 2330 | train/epoch_330/ex iie aii 2331 | train/epoch_330/ex bbh hhb 2332 | train/epoch_330/ex fifi ifif 2333 | train/epoch_330/ex gdggd cdgdd 2334 | train/epoch_330{1.29s} 2335 | train/epoch_331/loss 4.8431 2336 | train/epoch_331/ex dd dd 2337 | train/epoch_331/ex j j 2338 | train/epoch_331/ex gbg gbg 2339 | train/epoch_331/ex ddddd ddddd 2340 | train/epoch_331/ex ddddddd ddddddd 2341 | train/epoch_331{1.28s} 2342 | train/epoch_332/loss 5.2783 2343 | train/epoch_332/ex jjj jjj 2344 | train/epoch_332/ex iiiiii iiiiii 2345 | train/epoch_332/ex ggc igg 2346 | train/epoch_332/ex ghggh hgghb 2347 | train/epoch_332/ex d d 2348 | train/epoch_332{1.27s} 2349 | train/epoch_333/loss 4.8253 2350 | train/epoch_333/ex cccc cccc 2351 | train/epoch_333/ex fff ddd 2352 | train/epoch_333/ex efefef idfidd 2353 | train/epoch_333/ex c b 2354 | train/epoch_333/ex ddj dda 2355 | train/epoch_333{1.26s} 2356 | train/epoch_334/loss 5.4519 2357 | train/epoch_334/ex jh je 2358 | train/epoch_334/ex e h 2359 | train/epoch_334/ex jjjjjj jjjjjj 2360 | train/epoch_334/ex ddddddd ddddddd 2361 | train/epoch_334/ex g b 2362 | train/epoch_334{1.28s} 2363 | train/epoch_335/loss 4.9193 2364 | train/epoch_335/ex j f 2365 | train/epoch_335/ex ccf fcc 2366 | train/epoch_335/ex ffe eff 2367 | train/epoch_335/ex ddddd ddddd 2368 | train/epoch_335/ex iii iii 2369 | train/epoch_335{1.28s} 2370 | train/epoch_336/loss 5.3302 2371 | train/epoch_336/ex jjjjjjj jjjjjjj 2372 | train/epoch_336/ex ccjc cjcc 2373 | train/epoch_336/ex dddddd dddddd 2374 | train/epoch_336/ex bbbi bbbi 2375 | train/epoch_336/ex iijii jjijj 2376 | train/epoch_336{1.27s} 2377 | train/epoch_337/loss 4.9250 2378 | train/epoch_337/ex gggggg gggggg 2379 | train/epoch_337/ex eebeeeeb eeceeeeb 2380 | train/epoch_337/ex ddddddd ddddddd 2381 | train/epoch_337/ex fhfhfhf fjhhjhj 2382 | train/epoch_337/ex b a 2383 | train/epoch_337{1.25s} 2384 | -------------------------------------------------------------------------------- /exp/test/run.out: -------------------------------------------------------------------------------- 1 | train/epoch_000/loss 22.8362 2 | train/epoch_000/ex c jjjjjjjj 3 | train/epoch_000/ex c h 4 | train/epoch_000/ex hhhhhh hh 5 | train/epoch_000/ex c be 6 | train/epoch_000/ex c g 7 | train/epoch_000{1.67s} 8 | train/epoch_001/loss 17.8316 9 | train/epoch_001/ex hhhhhhhhhhhhhh hghhh 10 | train/epoch_001/ex eeeeee cccgc 11 | train/epoch_001/ex dd dgg 12 | train/epoch_001/ex jjj bba 13 | train/epoch_001/ex dddddddd bbbbb 14 | train/epoch_001{1.66s} 15 | train/epoch_002/loss 15.7034 16 | train/epoch_002/ex hhhhhhhh ccccccc 17 | train/epoch_002/ex ee de 18 | train/epoch_002/ex ee hj 19 | train/epoch_002/ex aaaaaaa jhhhjh 20 | train/epoch_002/ex ee ee 21 | train/epoch_002{1.68s} 22 | train/epoch_003/loss 15.4253 23 | train/epoch_003/ex hhhhh gjjj 24 | train/epoch_003/ex cccc fff 25 | train/epoch_003/ex cccc ddd 26 | train/epoch_003/ex ddd jj 27 | train/epoch_003/ex hhhhh iiii 28 | train/epoch_003{1.64s} 29 | train/epoch_004/loss 14.3880 30 | train/epoch_004/ex ddd eei 31 | train/epoch_004/ex jjj bbb 32 | train/epoch_004/ex dd jj 33 | train/epoch_004/ex dd hh 34 | train/epoch_004/ex hhhhhh hhhhhhh 35 | train/epoch_004{1.66s} 36 | train/epoch_005/loss 13.5733 37 | train/epoch_005/ex d j 38 | train/epoch_005/ex ddddddddd fffffffff 39 | train/epoch_005/ex jjjjjj jjjjjj 40 | train/epoch_005/ex j d 41 | train/epoch_005/ex ccccc hhchc 42 | train/epoch_005{1.66s} 43 | train/epoch_006/loss 13.6279 44 | train/epoch_006/ex i f 45 | train/epoch_006/ex jjjjj fffff 46 | train/epoch_006/ex i c 47 | train/epoch_006/ex ii dg 48 | train/epoch_006/ex i d 49 | train/epoch_006{1.66s} 50 | train/epoch_007/loss 12.9868 51 | train/epoch_007/ex d e 52 | train/epoch_007/ex d jj 53 | train/epoch_007/ex ggg jjjj 54 | train/epoch_007/ex ccc ddee 55 | train/epoch_007/ex ggg eeb 56 | train/epoch_007{1.65s} 57 | train/epoch_008/loss 13.9978 58 | train/epoch_008/ex jjj iii 59 | train/epoch_008/ex jjjj ddda 60 | train/epoch_008/ex jjj ccj 61 | train/epoch_008/ex jjj jjf 62 | train/epoch_008/ex jjjj eeeee 63 | train/epoch_008{1.64s} 64 | train/epoch_009/loss 12.8823 65 | train/epoch_009/ex ddd gee 66 | train/epoch_009/ex ddd ggg 67 | train/epoch_009/ex gggg gece 68 | train/epoch_009/ex ggggggggg gffififi 69 | train/epoch_009/ex ggggg fffff 70 | train/epoch_009{1.62s} 71 | train/epoch_010/loss 12.7981 72 | train/epoch_010/ex iii ddd 73 | train/epoch_010/ex a a 74 | train/epoch_010/ex ggg hhi 75 | train/epoch_010/ex ggggg bcccb 76 | train/epoch_010/ex ggg iii 77 | train/epoch_010{1.71s} 78 | train/epoch_011/loss 13.0906 79 | train/epoch_011/ex ffff aaab 80 | train/epoch_011/ex fff fff 81 | train/epoch_011/ex jj bd 82 | train/epoch_011/ex jj fd 83 | train/epoch_011/ex ggg hgg 84 | train/epoch_011{1.75s} 85 | train/epoch_012/loss 13.2870 86 | train/epoch_012/ex ccccc hhhhh 87 | train/epoch_012/ex ff jj 88 | train/epoch_012/ex fff efg 89 | train/epoch_012/ex ff fg 90 | train/epoch_012/ex eee daa 91 | train/epoch_012{1.73s} 92 | train/epoch_013/loss 12.4678 93 | train/epoch_013/ex jjjj aaaa 94 | train/epoch_013/ex jj gg 95 | train/epoch_013/ex jjjj dddd 96 | train/epoch_013/ex d d 97 | train/epoch_013/ex jjjjj gggga 98 | train/epoch_013{1.68s} 99 | train/epoch_014/loss 12.5800 100 | train/epoch_014/ex ee ij 101 | train/epoch_014/ex h a 102 | train/epoch_014/ex cc dc 103 | train/epoch_014/ex jjjjj eaaaa 104 | train/epoch_014/ex c h 105 | train/epoch_014{1.70s} 106 | train/epoch_015/loss 13.1313 107 | train/epoch_015/ex jj jg 108 | train/epoch_015/ex ggggg iiiii 109 | train/epoch_015/ex jj dd 110 | train/epoch_015/ex jj dd 111 | train/epoch_015/ex bbbbb gggge 112 | train/epoch_015{1.66s} 113 | train/epoch_016/loss 12.1703 114 | train/epoch_016/ex fff aah 115 | train/epoch_016/ex c j 116 | train/epoch_016/ex fff igg 117 | train/epoch_016/ex cccccccc ddddddd 118 | train/epoch_016/ex ffff hhhh 119 | train/epoch_016{1.77s} 120 | train/epoch_017/loss 12.0576 121 | train/epoch_017/ex ccccccc afaaafa 122 | train/epoch_017/ex g i 123 | train/epoch_017/ex cccccc ccccce 124 | train/epoch_017/ex d i 125 | train/epoch_017/ex ggggg hbhhb 126 | train/epoch_017{1.72s} 127 | train/epoch_018/loss 12.5933 128 | train/epoch_018/ex iiii ffff 129 | train/epoch_018/ex bbbbbb eggggg 130 | train/epoch_018/ex aaa fhf 131 | train/epoch_018/ex ii fh 132 | train/epoch_018/ex bbbbb iiiii 133 | train/epoch_018{1.68s} 134 | train/epoch_019/loss 12.2876 135 | train/epoch_019/ex hhhh hjbb 136 | train/epoch_019/ex iii ffe 137 | train/epoch_019/ex b d 138 | train/epoch_019/ex c d 139 | train/epoch_019/ex ccccc fhjfh 140 | train/epoch_019{1.68s} 141 | train/epoch_020/loss 12.1402 142 | train/epoch_020/ex f c 143 | train/epoch_020/ex hhh ddd 144 | train/epoch_020/ex hhhh gggg 145 | train/epoch_020/ex fff iff 146 | train/epoch_020/ex hhh ddd 147 | train/epoch_020{1.70s} 148 | train/epoch_021/loss 12.5671 149 | train/epoch_021/ex eee bbb 150 | train/epoch_021/ex ii bb 151 | train/epoch_021/ex i a 152 | train/epoch_021/ex ggg jjj 153 | train/epoch_021/ex ggg fbb 154 | train/epoch_021{1.73s} 155 | train/epoch_022/loss 12.4098 156 | train/epoch_022/ex hhhh didd 157 | train/epoch_022/ex ddd dci 158 | train/epoch_022/ex ggg bee 159 | train/epoch_022/ex hh cj 160 | train/epoch_022/ex d a 161 | train/epoch_022{1.78s} 162 | train/epoch_023/loss 11.6609 163 | train/epoch_023/ex hhhhhh jhjhhh 164 | train/epoch_023/ex ccc adi 165 | train/epoch_023/ex h f 166 | train/epoch_023/ex ccc iii 167 | train/epoch_023/ex a d 168 | train/epoch_023{1.67s} 169 | train/epoch_024/loss 12.1278 170 | train/epoch_024/ex gggg iiii 171 | train/epoch_024/ex h e 172 | train/epoch_024/ex jjjj aaaa 173 | train/epoch_024/ex gg fg 174 | train/epoch_024/ex jjjj jjjb 175 | train/epoch_024{1.73s} 176 | train/epoch_025/loss 11.1727 177 | train/epoch_025/ex d g 178 | train/epoch_025/ex ee ce 179 | train/epoch_025/ex fff ffd 180 | train/epoch_025/ex hhhhh hhhhh 181 | train/epoch_025/ex ee he 182 | train/epoch_025{1.72s} 183 | train/epoch_026/loss 11.3304 184 | train/epoch_026/ex fff eai 185 | train/epoch_026/ex ccccccc ccjcccc 186 | train/epoch_026/ex aaaaa aaaai 187 | train/epoch_026/ex jj ja 188 | train/epoch_026/ex aaaa jjjf 189 | train/epoch_026{1.64s} 190 | train/epoch_027/loss 11.3086 191 | train/epoch_027/ex ii bj 192 | train/epoch_027/ex i f 193 | train/epoch_027/ex c c 194 | train/epoch_027/ex ccc dcd 195 | train/epoch_027/ex iiii giig 196 | train/epoch_027{1.68s} 197 | train/epoch_028/loss 11.5476 198 | train/epoch_028/ex eee bjj 199 | train/epoch_028/ex iiii jddd 200 | train/epoch_028/ex hhhh hhhh 201 | train/epoch_028/ex c g 202 | train/epoch_028/ex aa gd 203 | train/epoch_028{1.73s} 204 | train/epoch_029/loss 11.0319 205 | train/epoch_029/ex ddd ddj 206 | train/epoch_029/ex i e 207 | train/epoch_029/ex ee hh 208 | train/epoch_029/ex b c 209 | train/epoch_029/ex dddd cddi 210 | train/epoch_029{1.67s} 211 | train/epoch_030/loss 10.6165 212 | train/epoch_030/ex ggg ggg 213 | train/epoch_030/ex bb bb 214 | train/epoch_030/ex dddddd ddddhd 215 | train/epoch_030/ex jj jj 216 | train/epoch_030/ex iiii ibbb 217 | train/epoch_030{1.78s} 218 | train/epoch_031/loss 10.4115 219 | train/epoch_031/ex aaaaaa aagaaa 220 | train/epoch_031/ex gg dg 221 | train/epoch_031/ex bbbb bbgb 222 | train/epoch_031/ex gggg aagg 223 | train/epoch_031/ex eeee eeea 224 | train/epoch_031{1.69s} 225 | train/epoch_032/loss 9.9072 226 | train/epoch_032/ex dddd dddd 227 | train/epoch_032/ex ggg ggh 228 | train/epoch_032/ex iiiii iiiii 229 | train/epoch_032/ex cccc cccg 230 | train/epoch_032/ex bbbbbb gggdgg 231 | train/epoch_032{1.81s} 232 | train/epoch_033/loss 10.3149 233 | train/epoch_033/ex d d 234 | train/epoch_033/ex ii gb 235 | train/epoch_033/ex dd de 236 | train/epoch_033/ex iii iii 237 | train/epoch_033/ex gggg gbbe 238 | train/epoch_033{1.69s} 239 | train/epoch_034/loss 9.4857 240 | train/epoch_034/ex d i 241 | train/epoch_034/ex ccccc chcch 242 | train/epoch_034/ex ggggg ggggg 243 | train/epoch_034/ex bbb ddi 244 | train/epoch_034/ex d c 245 | train/epoch_034{1.68s} 246 | train/epoch_035/loss 9.1306 247 | train/epoch_035/ex i e 248 | train/epoch_035/ex eee deb 249 | train/epoch_035/ex ccc aca 250 | train/epoch_035/ex aaa haa 251 | train/epoch_035/ex d d 252 | train/epoch_035{1.63s} 253 | train/epoch_036/loss 9.2752 254 | train/epoch_036/ex bbb iii 255 | train/epoch_036/ex jjjjjj fjjjff 256 | train/epoch_036/ex ccc fcf 257 | train/epoch_036/ex ggg ggg 258 | train/epoch_036/ex bb bb 259 | train/epoch_036{1.65s} 260 | train/epoch_037/loss 9.0192 261 | train/epoch_037/ex bbb bbb 262 | train/epoch_037/ex eee hee 263 | train/epoch_037/ex hh fh 264 | train/epoch_037/ex ccc cbi 265 | train/epoch_037/ex e h 266 | train/epoch_037{1.63s} 267 | train/epoch_038/loss 8.5020 268 | train/epoch_038/ex ggg ggg 269 | train/epoch_038/ex aa ai 270 | train/epoch_038/ex d f 271 | train/epoch_038/ex jjj ahh 272 | train/epoch_038/ex jjjjjjjj jjjjjjj 273 | train/epoch_038{1.68s} 274 | train/epoch_039/loss 8.8784 275 | train/epoch_039/ex hhhh hhhh 276 | train/epoch_039/ex i i 277 | train/epoch_039/ex ddddd ddddd 278 | train/epoch_039/ex aaaa aaaa 279 | train/epoch_039/ex hhh ccc 280 | train/epoch_039{1.69s} 281 | train/epoch_040/loss 8.5456 282 | train/epoch_040/ex eee iff 283 | train/epoch_040/ex jjj jjj 284 | train/epoch_040/ex d e 285 | train/epoch_040/ex fffff ffffa 286 | train/epoch_040/ex ccc ccc 287 | train/epoch_040{1.68s} 288 | train/epoch_041/loss 7.9460 289 | train/epoch_041/ex a d 290 | train/epoch_041/ex bb ji 291 | train/epoch_041/ex f j 292 | train/epoch_041/ex d h 293 | train/epoch_041/ex gggggg gggggg 294 | train/epoch_041{1.75s} 295 | train/epoch_042/loss 8.4096 296 | train/epoch_042/ex jjjjj jjbbj 297 | train/epoch_042/ex bbbbb bbbib 298 | train/epoch_042/ex ee be 299 | train/epoch_042/ex hh be 300 | train/epoch_042/ex iiiiiii iiiigii 301 | train/epoch_042{1.70s} 302 | train/epoch_043/loss 8.3319 303 | train/epoch_043/ex hhhhhhh cccehhe 304 | train/epoch_043/ex aaaaaaa aabaaaa 305 | train/epoch_043/ex jjjj igjj 306 | train/epoch_043/ex bbb bbb 307 | train/epoch_043/ex eee iee 308 | train/epoch_043{1.61s} 309 | train/epoch_044/loss 8.2171 310 | train/epoch_044/ex bbb ajc 311 | train/epoch_044/ex jjjj jjjj 312 | train/epoch_044/ex iiii ciii 313 | train/epoch_044/ex dddd dddd 314 | train/epoch_044/ex dd dg 315 | train/epoch_044{1.70s} 316 | train/epoch_045/loss 8.4160 317 | train/epoch_045/ex ee fb 318 | train/epoch_045/ex d d 319 | train/epoch_045/ex fff fff 320 | train/epoch_045/ex jj de 321 | train/epoch_045/ex d d 322 | train/epoch_045{1.74s} 323 | train/epoch_046/loss 7.9525 324 | train/epoch_046/ex b a 325 | train/epoch_046/ex j j 326 | train/epoch_046/ex b c 327 | train/epoch_046/ex b d 328 | train/epoch_046/ex ggg gga 329 | train/epoch_046{1.65s} 330 | train/epoch_047/loss 8.0812 331 | train/epoch_047/ex ccc cee 332 | train/epoch_047/ex eeeee eeeee 333 | train/epoch_047/ex e e 334 | train/epoch_047/ex bbbbb abaaa 335 | train/epoch_047/ex hhhhh hfhhh 336 | train/epoch_047{1.64s} 337 | train/epoch_048/loss 7.9757 338 | train/epoch_048/ex eee eee 339 | train/epoch_048/ex jjjj jjjj 340 | train/epoch_048/ex hh hh 341 | train/epoch_048/ex fff ddd 342 | train/epoch_048/ex aaaaaaaa babababa 343 | train/epoch_048{1.63s} 344 | train/epoch_049/loss 8.2288 345 | train/epoch_049/ex aaa haa 346 | train/epoch_049/ex d g 347 | train/epoch_049/ex bb gh 348 | train/epoch_049/ex ccc ccc 349 | train/epoch_049/ex jjjj jddj 350 | train/epoch_049{1.67s} 351 | train/epoch_050/loss 7.7076 352 | train/epoch_050/ex bbbbbbb bbbbbbb 353 | train/epoch_050/ex jjjj jjjj 354 | train/epoch_050/ex aaaaaaaaaa aaaaaaaaae 355 | train/epoch_050/ex ddddddd cccdccd 356 | train/epoch_050/ex gggggg gjjggj 357 | train/epoch_050{1.67s} 358 | train/epoch_051/loss 7.5583 359 | train/epoch_051/ex gggg gcgg 360 | train/epoch_051/ex ffff fffj 361 | train/epoch_051/ex iiiiiii gifffff 362 | train/epoch_051/ex ii bb 363 | train/epoch_051/ex iiiiii igggig 364 | train/epoch_051{1.72s} 365 | train/epoch_052/loss 8.0744 366 | train/epoch_052/ex fffffff fefffff 367 | train/epoch_052/ex hhhhh hhihh 368 | train/epoch_052/ex jj ae 369 | train/epoch_052/ex bbbb bccc 370 | train/epoch_052/ex iiiih iccci 371 | train/epoch_052{1.66s} 372 | train/epoch_053/loss 7.7585 373 | train/epoch_053/ex dddd aadd 374 | train/epoch_053/ex eeeeg ggeee 375 | train/epoch_053/ex ggg gcb 376 | train/epoch_053/ex iiiii iiiii 377 | train/epoch_053/ex j f 378 | train/epoch_053{1.63s} 379 | train/epoch_054/loss 7.6292 380 | train/epoch_054/ex g b 381 | train/epoch_054/ex jjjj jjjj 382 | train/epoch_054/ex ddd ddd 383 | train/epoch_054/ex fffff aafac 384 | train/epoch_054/ex fff efc 385 | train/epoch_054{1.70s} 386 | train/epoch_055/loss 7.4907 387 | train/epoch_055/ex cccc aaaa 388 | train/epoch_055/ex b e 389 | train/epoch_055/ex bbbbb babja 390 | train/epoch_055/ex bb ib 391 | train/epoch_055/ex bbbbb bbbbf 392 | train/epoch_055{1.70s} 393 | train/epoch_056/loss 7.4383 394 | train/epoch_056/ex aaaaaaaaa aiaaiiiaa 395 | train/epoch_056/ex i a 396 | train/epoch_056/ex i i 397 | train/epoch_056/ex dd fe 398 | train/epoch_056/ex iiii iiii 399 | train/epoch_056{1.70s} 400 | train/epoch_057/loss 6.6370 401 | train/epoch_057/ex hh hh 402 | train/epoch_057/ex jjjjj jjjjj 403 | train/epoch_057/ex ff fb 404 | train/epoch_057/ex hhh hhg 405 | train/epoch_057/ex hd ih 406 | train/epoch_057{1.73s} 407 | train/epoch_058/loss 7.4613 408 | train/epoch_058/ex iiiii iaiii 409 | train/epoch_058/ex eeee fbbf 410 | train/epoch_058/ex i b 411 | train/epoch_058/ex ddd ddd 412 | train/epoch_058/ex ggggg gbggb 413 | train/epoch_058{1.63s} 414 | train/epoch_059/loss 7.8029 415 | train/epoch_059/ex ggg iee 416 | train/epoch_059/ex eeeee eeeee 417 | train/epoch_059/ex j h 418 | train/epoch_059/ex bbbb bbbc 419 | train/epoch_059/ex d a 420 | train/epoch_059{1.68s} 421 | train/epoch_060/loss 7.4298 422 | train/epoch_060/ex ddd ddd 423 | train/epoch_060/ex b b 424 | train/epoch_060/ex b d 425 | train/epoch_060/ex ffffff eeffee 426 | train/epoch_060/ex iiiiiii iiiiiii 427 | train/epoch_060{1.63s} 428 | train/epoch_061/loss 7.6609 429 | train/epoch_061/ex iiiiii iiigii 430 | train/epoch_061/ex fffif fafff 431 | train/epoch_061/ex bbb fdb 432 | train/epoch_061/ex bbbb baaa 433 | train/epoch_061/ex i i 434 | train/epoch_061{1.66s} 435 | train/epoch_062/loss 7.3057 436 | train/epoch_062/ex aaaaaaa aaaaaaa 437 | train/epoch_062/ex aaaaaaaaa aaaaaaaaa 438 | train/epoch_062/ex ai ai 439 | train/epoch_062/ex iiiii ibiii 440 | train/epoch_062/ex hh eh 441 | train/epoch_062{1.69s} 442 | train/epoch_063/loss 7.3409 443 | train/epoch_063/ex g e 444 | train/epoch_063/ex eeeei idide 445 | train/epoch_063/ex d a 446 | train/epoch_063/ex i i 447 | train/epoch_063/ex g g 448 | train/epoch_063{1.71s} 449 | train/epoch_064/loss 6.9645 450 | train/epoch_064/ex i h 451 | train/epoch_064/ex ee hh 452 | train/epoch_064/ex aaa aaa 453 | train/epoch_064/ex ccc ccc 454 | train/epoch_064/ex ii fi 455 | train/epoch_064{1.65s} 456 | train/epoch_065/loss 7.2653 457 | train/epoch_065/ex dd db 458 | train/epoch_065/ex fe de 459 | train/epoch_065/ex bfb fef 460 | train/epoch_065/ex eee bbb 461 | train/epoch_065/ex eee eej 462 | train/epoch_065{1.66s} 463 | train/epoch_066/loss 7.0616 464 | train/epoch_066/ex iiii iiii 465 | train/epoch_066/ex i j 466 | train/epoch_066/ex j i 467 | train/epoch_066/ex aaaa aaad 468 | train/epoch_066/ex ggggg ggggg 469 | train/epoch_066{1.67s} 470 | train/epoch_067/loss 7.0897 471 | train/epoch_067/ex j i 472 | train/epoch_067/ex b d 473 | train/epoch_067/ex ccccc ccccd 474 | train/epoch_067/ex jjjj jjjj 475 | train/epoch_067/ex dd bb 476 | train/epoch_067{1.68s} 477 | train/epoch_068/loss 7.2424 478 | Epoch 68: reducing learning rate of group 0 to 1.0000e-03. 479 | train/epoch_068/ex b b 480 | train/epoch_068/ex hhhe eeeg 481 | train/epoch_068/ex ggggg ggggg 482 | train/epoch_068/ex bbbbbbbb bggggggg 483 | train/epoch_068/ex d b 484 | train/epoch_068{1.78s} 485 | train/epoch_069/loss 6.6082 486 | train/epoch_069/ex iiiii iiiii 487 | train/epoch_069/ex bbiiii ibbbbb 488 | train/epoch_069/ex jjjj jjjj 489 | train/epoch_069/ex ggee egge 490 | train/epoch_069/ex bbbb bbbi 491 | train/epoch_069{1.68s} 492 | train/epoch_070/loss 6.7222 493 | train/epoch_070/ex hhhh bgbb 494 | train/epoch_070/ex dddd dddd 495 | train/epoch_070/ex aaj ajj 496 | train/epoch_070/ex cccc eeee 497 | train/epoch_070/ex j j 498 | train/epoch_070{1.61s} 499 | train/epoch_071/loss 7.0077 500 | train/epoch_071/ex bc cb 501 | train/epoch_071/ex ggg gga 502 | train/epoch_071/ex fgf fgf 503 | train/epoch_071/ex e i 504 | train/epoch_071/ex bbbb bebb 505 | train/epoch_071{1.60s} 506 | train/epoch_072/loss 6.9859 507 | train/epoch_072/ex cacc acca 508 | train/epoch_072/ex ffff ffff 509 | train/epoch_072/ex ddddddd ddddddd 510 | train/epoch_072/ex ddd ddd 511 | train/epoch_072/ex gggg gggg 512 | train/epoch_072{1.64s} 513 | train/epoch_073/loss 6.4847 514 | train/epoch_073/ex d f 515 | train/epoch_073/ex dd df 516 | train/epoch_073/ex cccccb ebcbbc 517 | train/epoch_073/ex jccc ccjc 518 | train/epoch_073/ex jjj aaa 519 | train/epoch_073{1.62s} 520 | train/epoch_074/loss 6.6003 521 | train/epoch_074/ex eeec cece 522 | train/epoch_074/ex jjjj cjjj 523 | train/epoch_074/ex jjjj jjjj 524 | train/epoch_074/ex abba abba 525 | train/epoch_074/ex hb gj 526 | train/epoch_074{1.77s} 527 | train/epoch_075/loss 6.7520 528 | train/epoch_075/ex dd he 529 | train/epoch_075/ex hhhh hfhh 530 | train/epoch_075/ex h h 531 | train/epoch_075/ex ggggggg ggggggg 532 | train/epoch_075/ex aaaaaj jajjja 533 | train/epoch_075{1.66s} 534 | train/epoch_076/loss 6.6033 535 | train/epoch_076/ex hhhhh haahh 536 | train/epoch_076/ex iii iii 537 | train/epoch_076/ex aac aca 538 | train/epoch_076/ex ff ff 539 | train/epoch_076/ex bbbbbbb bbbbbbb 540 | train/epoch_076{1.66s} 541 | train/epoch_077/loss 6.5350 542 | train/epoch_077/ex c e 543 | train/epoch_077/ex dg dg 544 | train/epoch_077/ex gggggg gggggf 545 | train/epoch_077/ex ccgggg gccgcc 546 | train/epoch_077/ex ffffff ffffff 547 | train/epoch_077{1.72s} 548 | train/epoch_078/loss 6.7589 549 | train/epoch_078/ex eefe fefe 550 | train/epoch_078/ex ddddd ddddd 551 | train/epoch_078/ex cc aa 552 | train/epoch_078/ex ddd ddd 553 | train/epoch_078/ex cc fc 554 | train/epoch_078{1.64s} 555 | train/epoch_079/loss 6.8897 556 | train/epoch_079/ex aaaaa aaaah 557 | train/epoch_079/ex eeee eeee 558 | train/epoch_079/ex jddbj jbbbb 559 | train/epoch_079/ex b b 560 | train/epoch_079/ex d d 561 | train/epoch_079{1.62s} 562 | train/epoch_080/loss 6.6700 563 | train/epoch_080/ex bbb jjj 564 | train/epoch_080/ex cccc cccc 565 | train/epoch_080/ex de ec 566 | train/epoch_080/ex jjjj jjjj 567 | train/epoch_080/ex dddd dddd 568 | train/epoch_080{1.69s} 569 | train/epoch_081/loss 6.2871 570 | train/epoch_081/ex ii hi 571 | train/epoch_081/ex hh ii 572 | train/epoch_081/ex da gd 573 | train/epoch_081/ex jg jd 574 | train/epoch_081/ex eei dee 575 | train/epoch_081{1.69s} 576 | train/epoch_082/loss 6.6473 577 | train/epoch_082/ex dddg gddd 578 | train/epoch_082/ex eeb ebb 579 | train/epoch_082/ex didi fdfd 580 | train/epoch_082/ex cc ii 581 | train/epoch_082/ex bdb edb 582 | train/epoch_082{1.62s} 583 | train/epoch_083/loss 6.8588 584 | train/epoch_083/ex ggg gge 585 | train/epoch_083/ex fffe efff 586 | train/epoch_083/ex ccccc dcccc 587 | train/epoch_083/ex fafa adea 588 | train/epoch_083/ex cccccc cceeie 589 | train/epoch_083{1.69s} 590 | train/epoch_084/loss 6.4701 591 | train/epoch_084/ex hhh bhh 592 | train/epoch_084/ex eee geg 593 | train/epoch_084/ex ccccc ceeee 594 | train/epoch_084/ex dddd ddad 595 | train/epoch_084/ex jc fj 596 | train/epoch_084{1.68s} 597 | train/epoch_085/loss 6.4537 598 | train/epoch_085/ex aa ef 599 | train/epoch_085/ex hhh fff 600 | train/epoch_085/ex aaaa aggg 601 | train/epoch_085/ex hhh hhh 602 | train/epoch_085/ex c c 603 | train/epoch_085{1.64s} 604 | train/epoch_086/loss 6.0545 605 | train/epoch_086/ex iiiii eeeee 606 | train/epoch_086/ex eeej jejj 607 | train/epoch_086/ex ccc aaa 608 | train/epoch_086/ex ggggg hgggg 609 | train/epoch_086/ex c c 610 | train/epoch_086{1.63s} 611 | train/epoch_087/loss 6.5613 612 | train/epoch_087/ex aaaaaaa fffhaah 613 | train/epoch_087/ex b a 614 | train/epoch_087/ex iiii iibi 615 | train/epoch_087/ex gg he 616 | train/epoch_087/ex ffff fffg 617 | train/epoch_087{1.71s} 618 | train/epoch_088/loss 6.4960 619 | train/epoch_088/ex eee eei 620 | train/epoch_088/ex hch hhc 621 | train/epoch_088/ex bf fi 622 | train/epoch_088/ex bbb bbb 623 | train/epoch_088/ex ddddddd ddddddd 624 | train/epoch_088{1.59s} 625 | train/epoch_089/loss 6.1300 626 | train/epoch_089/ex dddddddddddd dddddddddddd 627 | train/epoch_089/ex ccc ccc 628 | train/epoch_089/ex ccccc dcccc 629 | train/epoch_089/ex ccc ccc 630 | train/epoch_089/ex bb bh 631 | train/epoch_089{1.69s} 632 | train/epoch_090/loss 6.4890 633 | train/epoch_090/ex cccc cccg 634 | train/epoch_090/ex hhh iii 635 | train/epoch_090/ex cc cc 636 | train/epoch_090/ex c h 637 | train/epoch_090/ex dc hd 638 | train/epoch_090{1.68s} 639 | train/epoch_091/loss 6.2117 640 | train/epoch_091/ex cccc cccc 641 | train/epoch_091/ex iiiiiii iiiiiii 642 | train/epoch_091/ex cca cca 643 | train/epoch_091/ex aaaaaa iaacaa 644 | train/epoch_091/ex c c 645 | train/epoch_091{1.74s} 646 | train/epoch_092/loss 6.4197 647 | train/epoch_092/ex fbf cfb 648 | train/epoch_092/ex ccc ccj 649 | train/epoch_092/ex bb bb 650 | train/epoch_092/ex fff fff 651 | train/epoch_092/ex db bf 652 | train/epoch_092{1.66s} 653 | train/epoch_093/loss 6.1316 654 | train/epoch_093/ex gggggg cggggg 655 | train/epoch_093/ex efe hef 656 | train/epoch_093/ex jjjj jjjj 657 | train/epoch_093/ex i d 658 | train/epoch_093/ex eee eej 659 | train/epoch_093{1.67s} 660 | train/epoch_094/loss 6.6532 661 | train/epoch_094/ex hhh hhh 662 | train/epoch_094/ex ccgc gcgc 663 | train/epoch_094/ex hhh dhh 664 | train/epoch_094/ex cccccc cccccc 665 | train/epoch_094/ex eee aaa 666 | train/epoch_094{1.59s} 667 | train/epoch_095/loss 6.5366 668 | train/epoch_095/ex fb fg 669 | train/epoch_095/ex dddddd dddcdd 670 | train/epoch_095/ex biii ebbb 671 | train/epoch_095/ex fb fb 672 | train/epoch_095/ex ggg ggg 673 | train/epoch_095{1.63s} 674 | train/epoch_096/loss 6.7092 675 | train/epoch_096/ex gggg fggg 676 | train/epoch_096/ex e c 677 | train/epoch_096/ex ddd ddd 678 | train/epoch_096/ex i f 679 | train/epoch_096/ex i i 680 | train/epoch_096{1.71s} 681 | train/epoch_097/loss 6.5643 682 | Epoch 97: reducing learning rate of group 0 to 5.0000e-04. 683 | train/epoch_097/ex bbbbbb dbbbbb 684 | train/epoch_097/ex b b 685 | train/epoch_097/ex hff fif 686 | train/epoch_097/ex ccc ece 687 | train/epoch_097/ex addddd ddddda 688 | train/epoch_097{1.65s} 689 | train/epoch_098/loss 6.5670 690 | train/epoch_098/ex ffh jeh 691 | train/epoch_098/ex ii di 692 | train/epoch_098/ex cccccc cceecc 693 | train/epoch_098/ex e a 694 | train/epoch_098/ex jjjj jjjj 695 | train/epoch_098{1.66s} 696 | train/epoch_099/loss 6.3209 697 | train/epoch_099/ex bbb bfb 698 | train/epoch_099/ex fffff fffff 699 | train/epoch_099/ex je ge 700 | train/epoch_099/ex gjgjgj jjjggj 701 | train/epoch_099/ex ccc ccc 702 | train/epoch_099{1.64s} 703 | train/epoch_100/loss 6.8810 704 | train/epoch_100/ex jiij ijii 705 | train/epoch_100/ex ggg ggj 706 | train/epoch_100/ex hhh hhh 707 | train/epoch_100/ex gg gg 708 | train/epoch_100/ex iii eej 709 | train/epoch_100{1.69s} 710 | train/epoch_101/loss 6.2407 711 | train/epoch_101/ex ic ch 712 | train/epoch_101/ex ccc cjc 713 | train/epoch_101/ex ic fc 714 | train/epoch_101/ex jjh hjj 715 | train/epoch_101/ex hhhhh jhjhj 716 | train/epoch_101{1.68s} 717 | train/epoch_102/loss 6.1463 718 | train/epoch_102/ex adddaa djajag 719 | train/epoch_102/ex iii hhh 720 | train/epoch_102/ex eeee eaee 721 | train/epoch_102/ex d f 722 | train/epoch_102/ex ggggh hhghh 723 | train/epoch_102{1.70s} 724 | train/epoch_103/loss 6.5568 725 | train/epoch_103/ex jffjf jjfjj 726 | train/epoch_103/ex bbb bbb 727 | train/epoch_103/ex jjjjjjccj cjcjcjjcj 728 | train/epoch_103/ex hhh hhh 729 | train/epoch_103/ex hhh hhh 730 | train/epoch_103{1.71s} 731 | train/epoch_104/loss 6.4236 732 | train/epoch_104/ex jjj iii 733 | train/epoch_104/ex aaaaaaaaa aaaaaaaaa 734 | train/epoch_104/ex eeea ggaa 735 | train/epoch_104/ex i i 736 | train/epoch_104/ex bbbb bbbb 737 | train/epoch_104{1.65s} 738 | train/epoch_105/loss 6.5115 739 | train/epoch_105/ex iiiii iiiia 740 | train/epoch_105/ex aai aii 741 | train/epoch_105/ex jjjd hhhj 742 | train/epoch_105/ex ffff ffff 743 | train/epoch_105/ex ffjjff jffffj 744 | train/epoch_105{1.72s} 745 | train/epoch_106/loss 6.6293 746 | train/epoch_106/ex c c 747 | train/epoch_106/ex bd df 748 | train/epoch_106/ex cc cg 749 | train/epoch_106/ex jhhj hjjj 750 | train/epoch_106/ex hhhh hhhh 751 | train/epoch_106{1.67s} 752 | train/epoch_107/loss 7.0168 753 | train/epoch_107/ex cccc cccc 754 | train/epoch_107/ex jjjjjjjjjj jjhhjhjjhh 755 | train/epoch_107/ex i f 756 | train/epoch_107/ex b c 757 | train/epoch_107/ex aaa aab 758 | train/epoch_107{1.69s} 759 | train/epoch_108/loss 6.7053 760 | Epoch 108: reducing learning rate of group 0 to 2.5000e-04. 761 | train/epoch_108/ex fbfb ffbf 762 | train/epoch_108/ex e e 763 | train/epoch_108/ex hhh hhh 764 | train/epoch_108/ex aaaaa jaaaa 765 | train/epoch_108/ex e e 766 | train/epoch_108{1.66s} 767 | train/epoch_109/loss 6.0841 768 | train/epoch_109/ex jc ej 769 | train/epoch_109/ex hhhhhhhh chhhhhcc 770 | train/epoch_109/ex geg hee 771 | train/epoch_109/ex acacac caacac 772 | train/epoch_109/ex gj bg 773 | train/epoch_109{1.74s} 774 | train/epoch_110/loss 6.3016 775 | train/epoch_110/ex ic ic 776 | train/epoch_110/ex j e 777 | train/epoch_110/ex fffdd ffddd 778 | train/epoch_110/ex hhgg chha 779 | train/epoch_110/ex iej fij 780 | train/epoch_110{1.63s} 781 | train/epoch_111/loss 6.5304 782 | train/epoch_111/ex dd dd 783 | train/epoch_111/ex ccc ccc 784 | train/epoch_111/ex aaa aaf 785 | train/epoch_111/ex hhhhhhhhc ccchhhhcc 786 | train/epoch_111/ex ccccc ccfcc 787 | train/epoch_111{1.73s} 788 | train/epoch_112/loss 6.1326 789 | train/epoch_112/ex ib ib 790 | train/epoch_112/ex ggg ggg 791 | train/epoch_112/ex ggggg gjggg 792 | train/epoch_112/ex dddddd ddddic 793 | train/epoch_112/ex hhh eee 794 | train/epoch_112{1.72s} 795 | train/epoch_113/loss 5.9173 796 | train/epoch_113/ex cccc cccc 797 | train/epoch_113/ex cb bc 798 | train/epoch_113/ex gggggg ggggbg 799 | train/epoch_113/ex jjbb gbbb 800 | train/epoch_113/ex ddf ffd 801 | train/epoch_113{1.71s} 802 | train/epoch_114/loss 6.6359 803 | train/epoch_114/ex bggb bgbg 804 | train/epoch_114/ex aaa aaa 805 | train/epoch_114/ex j j 806 | train/epoch_114/ex edede ddedi 807 | train/epoch_114/ex heehe ehbdh 808 | train/epoch_114{1.61s} 809 | train/epoch_115/loss 5.9474 810 | train/epoch_115/ex ddd bdd 811 | train/epoch_115/ex bbbgg bbgbb 812 | train/epoch_115/ex ccccc ccccc 813 | train/epoch_115/ex ffff ffff 814 | train/epoch_115/ex j e 815 | train/epoch_115{1.72s} 816 | train/epoch_116/loss 6.7458 817 | train/epoch_116/ex fff aaa 818 | train/epoch_116/ex eee iie 819 | train/epoch_116/ex ggggggg ggggigi 820 | train/epoch_116/ex e h 821 | train/epoch_116/ex cc hc 822 | train/epoch_116{1.58s} 823 | train/epoch_117/loss 5.9001 824 | train/epoch_117/ex d h 825 | train/epoch_117/ex cccc cccc 826 | train/epoch_117/ex aeea eeaa 827 | train/epoch_117/ex iiiia iiiei 828 | train/epoch_117/ex did ied 829 | train/epoch_117{1.70s} 830 | train/epoch_118/loss 6.5518 831 | train/epoch_118/ex gj jb 832 | train/epoch_118/ex jj aa 833 | train/epoch_118/ex ccce eccc 834 | train/epoch_118/ex dddddddd ffbfffff 835 | train/epoch_118/ex he ch 836 | train/epoch_118{1.68s} 837 | train/epoch_119/loss 6.4336 838 | train/epoch_119/ex ddg add 839 | train/epoch_119/ex dd dd 840 | train/epoch_119/ex eeeeeee eeeeeee 841 | train/epoch_119/ex iiii iiii 842 | train/epoch_119/ex ififf iiiif 843 | train/epoch_119{1.65s} 844 | train/epoch_120/loss 6.3349 845 | train/epoch_120/ex df df 846 | train/epoch_120/ex fff fff 847 | train/epoch_120/ex jjjjj hhhhh 848 | train/epoch_120/ex aaaaaaa aaaaaaa 849 | train/epoch_120/ex bigb igbb 850 | train/epoch_120{1.65s} 851 | train/epoch_121/loss 6.3156 852 | train/epoch_121/ex icic cjii 853 | train/epoch_121/ex jj jj 854 | train/epoch_121/ex cd cg 855 | train/epoch_121/ex jjjj djjj 856 | train/epoch_121/ex eeee eeee 857 | train/epoch_121{1.65s} 858 | train/epoch_122/loss 6.7921 859 | train/epoch_122/ex dd dd 860 | train/epoch_122/ex eeeeeeeee eeeeeeeee 861 | train/epoch_122/ex fffff fffff 862 | train/epoch_122/ex hhh hjh 863 | train/epoch_122/ex aaa aaa 864 | train/epoch_122{1.66s} 865 | train/epoch_123/loss 6.4344 866 | train/epoch_123/ex gggggggg aaaaagaa 867 | train/epoch_123/ex ccccc ccccc 868 | train/epoch_123/ex ifififfiff ififfifiif 869 | train/epoch_123/ex iai fif 870 | train/epoch_123/ex i i 871 | train/epoch_123{1.70s} 872 | train/epoch_124/loss 6.5039 873 | train/epoch_124/ex jjjj jjjj 874 | train/epoch_124/ex c f 875 | train/epoch_124/ex jjjjj jjjjj 876 | train/epoch_124/ex jb ej 877 | train/epoch_124/ex jjjjj jjjja 878 | train/epoch_124{1.63s} 879 | train/epoch_125/loss 6.2283 880 | train/epoch_125/ex aa ad 881 | train/epoch_125/ex fjff ffjf 882 | train/epoch_125/ex d a 883 | train/epoch_125/ex hhhh hhhh 884 | train/epoch_125/ex eeeee eeeee 885 | train/epoch_125{1.74s} 886 | train/epoch_126/loss 6.2067 887 | train/epoch_126/ex dc id 888 | train/epoch_126/ex ccc ccc 889 | train/epoch_126/ex hhh hhh 890 | train/epoch_126/ex iii iii 891 | train/epoch_126/ex e h 892 | train/epoch_126{1.64s} 893 | train/epoch_127/loss 6.3030 894 | train/epoch_127/ex aaa hhh 895 | train/epoch_127/ex b j 896 | train/epoch_127/ex hj ha 897 | train/epoch_127/ex i b 898 | train/epoch_127/ex ccg cgg 899 | train/epoch_127{1.64s} 900 | train/epoch_128/loss 6.2002 901 | Epoch 128: reducing learning rate of group 0 to 1.2500e-04. 902 | train/epoch_128/ex gde edi 903 | train/epoch_128/ex fei ife 904 | train/epoch_128/ex bbbbbbh bbbbhbb 905 | train/epoch_128/ex j j 906 | train/epoch_128/ex eeeee eeehe 907 | train/epoch_128{1.67s} 908 | train/epoch_129/loss 6.1837 909 | train/epoch_129/ex ccbbbbbbbc cbcccccccc 910 | train/epoch_129/ex gcgc gicg 911 | train/epoch_129/ex ccbcbc bccccb 912 | train/epoch_129/ex jdddj dddjd 913 | train/epoch_129/ex bb gg 914 | train/epoch_129{1.65s} 915 | train/epoch_130/loss 6.4865 916 | train/epoch_130/ex gg gg 917 | train/epoch_130/ex ddddd ddddj 918 | train/epoch_130/ex hhib hfii 919 | train/epoch_130/ex d j 920 | train/epoch_130/ex jjjjjjj jjjjjjj 921 | train/epoch_130{1.64s} 922 | train/epoch_131/loss 5.8629 923 | train/epoch_131/ex eeeeeeeee eeeeeeeee 924 | train/epoch_131/ex gdeg dgdg 925 | train/epoch_131/ex fff ffg 926 | train/epoch_131/ex dddd dddh 927 | train/epoch_131/ex bbbb bbbb 928 | train/epoch_131{1.69s} 929 | train/epoch_132/loss 6.4737 930 | train/epoch_132/ex ccccc ccccc 931 | train/epoch_132/ex ddd ddd 932 | train/epoch_132/ex ggg ccc 933 | train/epoch_132/ex aag aaf 934 | train/epoch_132/ex ch hc 935 | train/epoch_132{1.70s} 936 | train/epoch_133/loss 5.8846 937 | train/epoch_133/ex hhh hhh 938 | train/epoch_133/ex jjjjj jjjjd 939 | train/epoch_133/ex dde jee 940 | train/epoch_133/ex b g 941 | train/epoch_133/ex ddii iddd 942 | train/epoch_133{1.70s} 943 | train/epoch_134/loss 6.2642 944 | train/epoch_134/ex aaaaaa baaaaa 945 | train/epoch_134/ex eeeee eeeee 946 | train/epoch_134/ex ccj cjj 947 | train/epoch_134/ex b d 948 | train/epoch_134/ex j e 949 | train/epoch_134{1.73s} 950 | train/epoch_135/loss 6.5267 951 | train/epoch_135/ex fj jf 952 | train/epoch_135/ex eeeeeeee eeeeehee 953 | train/epoch_135/ex aaaga aadga 954 | train/epoch_135/ex fafaf feffe 955 | train/epoch_135/ex d i 956 | train/epoch_135{1.63s} 957 | train/epoch_136/loss 6.0839 958 | train/epoch_136/ex ffff ffff 959 | train/epoch_136/ex d d 960 | train/epoch_136/ex eeee eeee 961 | train/epoch_136/ex ie ef 962 | train/epoch_136/ex hb hb 963 | train/epoch_136{1.63s} 964 | train/epoch_137/loss 6.1981 965 | train/epoch_137/ex ggggggggggg ggggggggggg 966 | train/epoch_137/ex cccccccc cccccccc 967 | train/epoch_137/ex jjj jjj 968 | train/epoch_137/ex d b 969 | train/epoch_137/ex iiiii iiiif 970 | train/epoch_137{1.70s} 971 | train/epoch_138/loss 5.9685 972 | train/epoch_138/ex ffffff ffffff 973 | train/epoch_138/ex hhh hhh 974 | train/epoch_138/ex jjdd jded 975 | train/epoch_138/ex ggg ggg 976 | train/epoch_138/ex i j 977 | train/epoch_138{1.69s} 978 | train/epoch_139/loss 6.2380 979 | train/epoch_139/ex ccc ehh 980 | train/epoch_139/ex iiff ffii 981 | train/epoch_139/ex hjj aah 982 | train/epoch_139/ex hhhhh hhhhh 983 | train/epoch_139/ex dde edd 984 | train/epoch_139{1.71s} 985 | train/epoch_140/loss 5.9524 986 | train/epoch_140/ex ggg hgg 987 | train/epoch_140/ex bb bf 988 | train/epoch_140/ex fffffg fgffff 989 | train/epoch_140/ex ee ee 990 | train/epoch_140/ex fffffff fffffff 991 | train/epoch_140{1.78s} 992 | train/epoch_141/loss 6.1213 993 | train/epoch_141/ex hhhhh hhhhh 994 | train/epoch_141/ex gbgb gdbf 995 | train/epoch_141/ex j c 996 | train/epoch_141/ex jjjj jjjj 997 | train/epoch_141/ex iiiii giiii 998 | train/epoch_141{1.64s} 999 | train/epoch_142/loss 5.9057 1000 | Epoch 142: reducing learning rate of group 0 to 6.2500e-05. 1001 | train/epoch_142/ex jjjj jjjj 1002 | train/epoch_142/ex jj jj 1003 | train/epoch_142/ex i g 1004 | train/epoch_142/ex iiiii iiiii 1005 | train/epoch_142/ex d c 1006 | train/epoch_142{1.72s} 1007 | train/epoch_143/loss 6.3737 1008 | train/epoch_143/ex da da 1009 | train/epoch_143/ex e c 1010 | train/epoch_143/ex iiiiiii iiiiiii 1011 | train/epoch_143/ex bbb bbb 1012 | train/epoch_143/ex jg ij 1013 | train/epoch_143{1.61s} 1014 | train/epoch_144/loss 6.5032 1015 | train/epoch_144/ex eieefe fddfei 1016 | train/epoch_144/ex ddb djj 1017 | train/epoch_144/ex fd fg 1018 | train/epoch_144/ex gggg gggg 1019 | train/epoch_144/ex ccccjj cccjcc 1020 | train/epoch_144{1.64s} 1021 | train/epoch_145/loss 6.1498 1022 | train/epoch_145/ex hhhh hhhh 1023 | train/epoch_145/ex ffif iifi 1024 | train/epoch_145/ex ai id 1025 | train/epoch_145/ex aja aaj 1026 | train/epoch_145/ex jj ji 1027 | train/epoch_145{1.64s} 1028 | train/epoch_146/loss 6.1023 1029 | train/epoch_146/ex d d 1030 | train/epoch_146/ex i d 1031 | train/epoch_146/ex dj jc 1032 | train/epoch_146/ex hhh hhh 1033 | train/epoch_146/ex e e 1034 | train/epoch_146{1.70s} 1035 | train/epoch_147/loss 6.7364 1036 | train/epoch_147/ex bbbbd gddgg 1037 | train/epoch_147/ex aaaa aaaa 1038 | train/epoch_147/ex ffff ffef 1039 | train/epoch_147/ex ffffff fffffa 1040 | train/epoch_147/ex cccccj jjjccj 1041 | train/epoch_147{1.68s} 1042 | train/epoch_148/loss 6.1966 1043 | train/epoch_148/ex aaaaaaa aabaaab 1044 | train/epoch_148/ex i d 1045 | train/epoch_148/ex fffff fffff 1046 | train/epoch_148/ex ddd ggg 1047 | train/epoch_148/ex fff fff 1048 | train/epoch_148{1.79s} 1049 | train/epoch_149/loss 6.2020 1050 | train/epoch_149/ex ddddd ddded 1051 | train/epoch_149/ex b b 1052 | train/epoch_149/ex ja jb 1053 | train/epoch_149/ex hhhhhhhhhhh hhhhhhhhhhh 1054 | train/epoch_149/ex ddd ggg 1055 | train/epoch_149{1.71s} 1056 | train/epoch_150/loss 5.8367 1057 | train/epoch_150/ex hhhhhhhhhaaa bhbaffbhbabb 1058 | train/epoch_150/ex h j 1059 | train/epoch_150/ex bb gg 1060 | train/epoch_150/ex e b 1061 | train/epoch_150/ex jjjj jjjj 1062 | train/epoch_150{1.64s} 1063 | train/epoch_151/loss 6.0384 1064 | train/epoch_151/ex aaa aaa 1065 | train/epoch_151/ex ii ii 1066 | train/epoch_151/ex e e 1067 | train/epoch_151/ex ccc ccc 1068 | train/epoch_151/ex ccdddd cddccc 1069 | train/epoch_151{1.71s} 1070 | train/epoch_152/loss 5.9184 1071 | train/epoch_152/ex ccbb cbbc 1072 | train/epoch_152/ex aaaaaaah ahhhhhah 1073 | train/epoch_152/ex aaaaaa geeebe 1074 | train/epoch_152/ex ee ee 1075 | train/epoch_152/ex bf db 1076 | train/epoch_152{1.69s} 1077 | train/epoch_153/loss 5.9824 1078 | train/epoch_153/ex ba ba 1079 | train/epoch_153/ex ii id 1080 | train/epoch_153/ex fffh diif 1081 | train/epoch_153/ex cccccc cccccc 1082 | train/epoch_153/ex di dh 1083 | train/epoch_153{1.75s} 1084 | train/epoch_154/loss 6.1138 1085 | train/epoch_154/ex cc cc 1086 | train/epoch_154/ex j h 1087 | train/epoch_154/ex hhhhhhh jhjjjjj 1088 | train/epoch_154/ex hhbb hbbb 1089 | train/epoch_154/ex gg cc 1090 | train/epoch_154{1.65s} 1091 | train/epoch_155/loss 6.3677 1092 | train/epoch_155/ex jj jj 1093 | train/epoch_155/ex b b 1094 | train/epoch_155/ex fj jc 1095 | train/epoch_155/ex d f 1096 | train/epoch_155/ex ggggg ggggg 1097 | train/epoch_155{1.61s} 1098 | train/epoch_156/loss 6.3078 1099 | train/epoch_156/ex bbb fbb 1100 | train/epoch_156/ex fffff hffff 1101 | train/epoch_156/ex c j 1102 | train/epoch_156/ex bcbc cbbc 1103 | train/epoch_156/ex b c 1104 | train/epoch_156{1.70s} 1105 | train/epoch_157/loss 6.2118 1106 | train/epoch_157/ex bbbb bbbb 1107 | train/epoch_157/ex d d 1108 | train/epoch_157/ex edede dbeec 1109 | train/epoch_157/ex de de 1110 | train/epoch_157/ex bbbbb jjbbb 1111 | train/epoch_157{1.67s} 1112 | train/epoch_158/loss 6.2537 1113 | train/epoch_158/ex b g 1114 | train/epoch_158/ex aaaag gdggg 1115 | train/epoch_158/ex fffff fffff 1116 | train/epoch_158/ex eeheeh heheae 1117 | train/epoch_158/ex di db 1118 | train/epoch_158{1.70s} 1119 | train/epoch_159/loss 6.4654 1120 | train/epoch_159/ex ggggh ghagg 1121 | train/epoch_159/ex jjj jjj 1122 | train/epoch_159/ex hhhhh hhhhh 1123 | train/epoch_159/ex iiiiiiiiiii iiiiiiiiiii 1124 | train/epoch_159/ex iiiii biiii 1125 | train/epoch_159{1.69s} 1126 | train/epoch_160/loss 5.6308 1127 | train/epoch_160/ex ebe ebe 1128 | train/epoch_160/ex jjj hhh 1129 | train/epoch_160/ex aj af 1130 | train/epoch_160/ex ggggg ggbbc 1131 | train/epoch_160/ex gggggg eggegg 1132 | train/epoch_160{1.70s} 1133 | train/epoch_161/loss 5.9329 1134 | train/epoch_161/ex iii iii 1135 | train/epoch_161/ex j g 1136 | train/epoch_161/ex jgjg gjjg 1137 | train/epoch_161/ex ggggg ggggh 1138 | train/epoch_161/ex ada iab 1139 | train/epoch_161{1.66s} 1140 | train/epoch_162/loss 6.1695 1141 | train/epoch_162/ex dddj cddd 1142 | train/epoch_162/ex fff fff 1143 | train/epoch_162/ex jg hg 1144 | train/epoch_162/ex e g 1145 | train/epoch_162/ex iiiii giiii 1146 | train/epoch_162{1.69s} 1147 | train/epoch_163/loss 6.4028 1148 | train/epoch_163/ex eeee eeeg 1149 | train/epoch_163/ex eee bee 1150 | train/epoch_163/ex i i 1151 | train/epoch_163/ex c c 1152 | train/epoch_163/ex hjhjhj jhhjhj 1153 | train/epoch_163{1.70s} 1154 | train/epoch_164/loss 6.2076 1155 | train/epoch_164/ex hhhhhh hhhbbh 1156 | train/epoch_164/ex aab abd 1157 | train/epoch_164/ex ha ea 1158 | train/epoch_164/ex bbbbbbbb bbbdbbbb 1159 | train/epoch_164/ex ii jj 1160 | train/epoch_164{1.69s} 1161 | train/epoch_165/loss 6.0833 1162 | train/epoch_165/ex aad daa 1163 | train/epoch_165/ex ec ed 1164 | train/epoch_165/ex ddddd ddddd 1165 | train/epoch_165/ex ffffb fffbb 1166 | train/epoch_165/ex aa fa 1167 | train/epoch_165{1.70s} 1168 | train/epoch_166/loss 6.0310 1169 | train/epoch_166/ex i j 1170 | train/epoch_166/ex aaaj jaaa 1171 | train/epoch_166/ex iig igg 1172 | train/epoch_166/ex ibi bdb 1173 | train/epoch_166/ex hhhh hhhh 1174 | train/epoch_166{1.68s} 1175 | train/epoch_167/loss 5.9586 1176 | train/epoch_167/ex eeeee eeeej 1177 | train/epoch_167/ex aaaaaaaa aaaaaaba 1178 | train/epoch_167/ex heheh hcehc 1179 | train/epoch_167/ex jgjg jgff 1180 | train/epoch_167/ex ddd dbb 1181 | train/epoch_167{1.62s} 1182 | train/epoch_168/loss 6.5112 1183 | train/epoch_168/ex bjb bjb 1184 | train/epoch_168/ex jh jf 1185 | train/epoch_168/ex jj jj 1186 | train/epoch_168/ex if ia 1187 | train/epoch_168/ex bb bb 1188 | train/epoch_168{1.70s} 1189 | train/epoch_169/loss 5.9743 1190 | train/epoch_169/ex j f 1191 | train/epoch_169/ex ffbffbfb bfbffbfb 1192 | train/epoch_169/ex e j 1193 | train/epoch_169/ex bb bb 1194 | train/epoch_169/ex cicccc cciici 1195 | train/epoch_169{1.64s} 1196 | train/epoch_170/loss 6.5227 1197 | train/epoch_170/ex cc cc 1198 | train/epoch_170/ex bj jb 1199 | train/epoch_170/ex iiiii iiiid 1200 | train/epoch_170/ex jjjj jjjj 1201 | train/epoch_170/ex aaaa aaaa 1202 | train/epoch_170{1.64s} 1203 | train/epoch_171/loss 6.1279 1204 | Epoch 171: reducing learning rate of group 0 to 3.1250e-05. 1205 | train/epoch_171/ex fffffff dffffff 1206 | train/epoch_171/ex ffcf cfff 1207 | train/epoch_171/ex ff ff 1208 | train/epoch_171/ex iiiii iiiii 1209 | train/epoch_171/ex d a 1210 | train/epoch_171{1.67s} 1211 | train/epoch_172/loss 6.4508 1212 | train/epoch_172/ex ddd ddd 1213 | train/epoch_172/ex ddedde aeeded 1214 | train/epoch_172/ex e i 1215 | train/epoch_172/ex ddd ddd 1216 | train/epoch_172/ex i a 1217 | train/epoch_172{1.69s} 1218 | train/epoch_173/loss 6.1593 1219 | train/epoch_173/ex gggg gggg 1220 | train/epoch_173/ex ejej jeej 1221 | train/epoch_173/ex gf bf 1222 | train/epoch_173/ex eeaea aaeaa 1223 | train/epoch_173/ex ddc jdd 1224 | train/epoch_173{1.64s} 1225 | train/epoch_174/loss 6.0932 1226 | train/epoch_174/ex hf fd 1227 | train/epoch_174/ex jjjjj jjjjj 1228 | train/epoch_174/ex ccffcffc fccffccf 1229 | train/epoch_174/ex i i 1230 | train/epoch_174/ex fffffffi ffiiiiif 1231 | train/epoch_174{1.61s} 1232 | train/epoch_175/loss 6.3809 1233 | train/epoch_175/ex jh hj 1234 | train/epoch_175/ex gd gd 1235 | train/epoch_175/ex fj ce 1236 | train/epoch_175/ex cb cf 1237 | train/epoch_175/ex heeehe eeehhh 1238 | train/epoch_175{1.70s} 1239 | train/epoch_176/loss 6.4938 1240 | train/epoch_176/ex ii ii 1241 | train/epoch_176/ex hhh hdh 1242 | train/epoch_176/ex iiiiiiiii iiiiiiiii 1243 | train/epoch_176/ex bbb gbb 1244 | train/epoch_176/ex gc gj 1245 | train/epoch_176{1.64s} 1246 | train/epoch_177/loss 5.6568 1247 | train/epoch_177/ex dd dd 1248 | train/epoch_177/ex iiiiic icccii 1249 | train/epoch_177/ex hdhd dhdh 1250 | train/epoch_177/ex iie iig 1251 | train/epoch_177/ex jjjjjjd jjjjjdj 1252 | train/epoch_177{1.69s} 1253 | train/epoch_178/loss 6.3999 1254 | train/epoch_178/ex ij ai 1255 | train/epoch_178/ex gggg gggd 1256 | train/epoch_178/ex j j 1257 | train/epoch_178/ex ded ede 1258 | train/epoch_178/ex ccccc ccccc 1259 | train/epoch_178{1.70s} 1260 | train/epoch_179/loss 5.7520 1261 | train/epoch_179/ex dd dd 1262 | train/epoch_179/ex ddd idd 1263 | train/epoch_179/ex iii cii 1264 | train/epoch_179/ex jjjjjj jjjjbb 1265 | train/epoch_179/ex fffff ffffg 1266 | train/epoch_179{1.78s} 1267 | train/epoch_180/loss 6.0310 1268 | train/epoch_180/ex eb be 1269 | train/epoch_180/ex aah aah 1270 | train/epoch_180/ex i i 1271 | train/epoch_180/ex bc bc 1272 | train/epoch_180/ex hhhh aaah 1273 | train/epoch_180{1.71s} 1274 | train/epoch_181/loss 6.3980 1275 | train/epoch_181/ex jjjjjj hhhhhj 1276 | train/epoch_181/ex aiifiiaa afaaafai 1277 | train/epoch_181/ex gggggggggg fgfgghggfg 1278 | train/epoch_181/ex dde cdd 1279 | train/epoch_181/ex ffe eaa 1280 | train/epoch_181{1.73s} 1281 | train/epoch_182/loss 6.1611 1282 | Epoch 182: reducing learning rate of group 0 to 1.5625e-05. 1283 | train/epoch_182/ex ddd ddd 1284 | train/epoch_182/ex ggggg ggggg 1285 | train/epoch_182/ex d i 1286 | train/epoch_182/ex aaaaaaa aaaaaaa 1287 | train/epoch_182/ex bjbjbj jbjbjj 1288 | train/epoch_182{1.63s} 1289 | train/epoch_183/loss 5.8197 1290 | train/epoch_183/ex ggggg ggggg 1291 | train/epoch_183/ex di di 1292 | train/epoch_183/ex i i 1293 | train/epoch_183/ex fgf fgf 1294 | train/epoch_183/ex dd dd 1295 | train/epoch_183{1.62s} 1296 | train/epoch_184/loss 5.7442 1297 | train/epoch_184/ex i i 1298 | train/epoch_184/ex hhh hhf 1299 | train/epoch_184/ex e e 1300 | train/epoch_184/ex bbbbb bbbgb 1301 | train/epoch_184/ex aai aii 1302 | train/epoch_184{1.67s} 1303 | train/epoch_185/loss 5.9449 1304 | train/epoch_185/ex fa ha 1305 | train/epoch_185/ex jddj cdjj 1306 | train/epoch_185/ex ccccccccc ccccccccc 1307 | train/epoch_185/ex bbbb bbba 1308 | train/epoch_185/ex idid fdid 1309 | train/epoch_185{1.69s} 1310 | train/epoch_186/loss 6.4132 1311 | train/epoch_186/ex i i 1312 | train/epoch_186/ex ffff ffff 1313 | train/epoch_186/ex d a 1314 | train/epoch_186/ex iiie geee 1315 | train/epoch_186/ex hhhh hhhh 1316 | train/epoch_186{1.64s} 1317 | train/epoch_187/loss 6.2593 1318 | train/epoch_187/ex fc cf 1319 | train/epoch_187/ex ddddddd ddddddd 1320 | train/epoch_187/ex eeeeeee eeeeeee 1321 | train/epoch_187/ex hhhhhhh hhhhhee 1322 | train/epoch_187/ex j j 1323 | train/epoch_187{1.62s} 1324 | train/epoch_188/loss 5.9596 1325 | train/epoch_188/ex hhhh hhhh 1326 | train/epoch_188/ex fff bff 1327 | train/epoch_188/ex bbb bbb 1328 | train/epoch_188/ex iiiiii ieiiii 1329 | train/epoch_188/ex edded edeee 1330 | train/epoch_188{1.65s} 1331 | train/epoch_189/loss 5.5558 1332 | train/epoch_189/ex fe fe 1333 | train/epoch_189/ex ddf dda 1334 | train/epoch_189/ex ddbd bdbd 1335 | train/epoch_189/ex iid dii 1336 | train/epoch_189/ex iii iii 1337 | train/epoch_189{1.64s} 1338 | train/epoch_190/loss 6.5355 1339 | train/epoch_190/ex g g 1340 | train/epoch_190/ex d d 1341 | train/epoch_190/ex jjjjh cjjjc 1342 | train/epoch_190/ex hhhhhh hhhhhh 1343 | train/epoch_190/ex jg gj 1344 | train/epoch_190{1.62s} 1345 | train/epoch_191/loss 6.4038 1346 | train/epoch_191/ex ggg ggg 1347 | train/epoch_191/ex fjf fjf 1348 | train/epoch_191/ex hhh hhh 1349 | train/epoch_191/ex i i 1350 | train/epoch_191/ex iii iii 1351 | train/epoch_191{1.63s} 1352 | train/epoch_192/loss 6.2900 1353 | train/epoch_192/ex b b 1354 | train/epoch_192/ex cgcg gcec 1355 | train/epoch_192/ex aaaaa aaaaa 1356 | train/epoch_192/ex jj jj 1357 | train/epoch_192/ex dc dc 1358 | train/epoch_192{1.66s} 1359 | train/epoch_193/loss 6.0979 1360 | train/epoch_193/ex d c 1361 | train/epoch_193/ex aaa aaa 1362 | train/epoch_193/ex bi ib 1363 | train/epoch_193/ex ff fa 1364 | train/epoch_193/ex cj cj 1365 | train/epoch_193{1.64s} 1366 | train/epoch_194/loss 5.9652 1367 | train/epoch_194/ex i i 1368 | train/epoch_194/ex ggg ggg 1369 | train/epoch_194/ex fd fd 1370 | train/epoch_194/ex ggggjj jjjjgj 1371 | train/epoch_194/ex hhhhf hffhh 1372 | train/epoch_194{1.65s} 1373 | train/epoch_195/loss 5.6970 1374 | train/epoch_195/ex jjdj djdd 1375 | train/epoch_195/ex c h 1376 | train/epoch_195/ex hhhhhhhh dbhbdbhd 1377 | train/epoch_195/ex d b 1378 | train/epoch_195/ex i i 1379 | train/epoch_195{1.65s} 1380 | train/epoch_196/loss 6.1554 1381 | train/epoch_196/ex ggg jgg 1382 | train/epoch_196/ex gg hh 1383 | train/epoch_196/ex hhhh hhhh 1384 | train/epoch_196/ex ddddddd hdddddd 1385 | train/epoch_196/ex bgbggb ggbbbg 1386 | train/epoch_196{1.72s} 1387 | train/epoch_197/loss 5.6966 1388 | train/epoch_197/ex e a 1389 | train/epoch_197/ex d a 1390 | train/epoch_197/ex e c 1391 | train/epoch_197/ex gdg ggd 1392 | train/epoch_197/ex bbc cbb 1393 | train/epoch_197{1.75s} 1394 | train/epoch_198/loss 6.3850 1395 | train/epoch_198/ex ccic icci 1396 | train/epoch_198/ex i h 1397 | train/epoch_198/ex ici ijc 1398 | train/epoch_198/ex bb bb 1399 | train/epoch_198/ex jgjg gejj 1400 | train/epoch_198{1.72s} 1401 | train/epoch_199/loss 6.4086 1402 | train/epoch_199/ex iiiii iiiii 1403 | train/epoch_199/ex ddd ddd 1404 | train/epoch_199/ex c g 1405 | train/epoch_199/ex j f 1406 | train/epoch_199/ex aaag gagg 1407 | train/epoch_199{1.67s} 1408 | train/epoch_200/loss 6.4065 1409 | Epoch 200: reducing learning rate of group 0 to 7.8125e-06. 1410 | train/epoch_200/ex ffbbffbf bfbbfbfb 1411 | train/epoch_200/ex ggd dgd 1412 | train/epoch_200/ex ccccc ccccc 1413 | train/epoch_200/ex eeee eeee 1414 | train/epoch_200/ex dd bb 1415 | train/epoch_200{1.61s} 1416 | train/epoch_201/loss 6.2569 1417 | train/epoch_201/ex b h 1418 | train/epoch_201/ex ddbb bdbb 1419 | train/epoch_201/ex aaaaaaaa aaaaaaaa 1420 | train/epoch_201/ex jjj jji 1421 | train/epoch_201/ex jaj ejj 1422 | train/epoch_201{1.65s} 1423 | train/epoch_202/loss 5.9009 1424 | train/epoch_202/ex aaaaai aaaiai 1425 | train/epoch_202/ex ggggg hgggg 1426 | train/epoch_202/ex jd bj 1427 | train/epoch_202/ex bb bb 1428 | train/epoch_202/ex ei ej 1429 | train/epoch_202{1.69s} 1430 | train/epoch_203/loss 5.9967 1431 | train/epoch_203/ex ggggf fggfh 1432 | train/epoch_203/ex bj bg 1433 | train/epoch_203/ex ababab baccab 1434 | train/epoch_203/ex aaaaa ajeae 1435 | train/epoch_203/ex deded dedde 1436 | train/epoch_203{1.71s} 1437 | train/epoch_204/loss 5.9941 1438 | train/epoch_204/ex ccee eecc 1439 | train/epoch_204/ex gjjg jggj 1440 | train/epoch_204/ex ccccccccc ccccccccc 1441 | train/epoch_204/ex bbaaa bbabb 1442 | train/epoch_204/ex d d 1443 | train/epoch_204{1.66s} 1444 | train/epoch_205/loss 6.2342 1445 | train/epoch_205/ex e i 1446 | train/epoch_205/ex ggg ggg 1447 | train/epoch_205/ex ee dd 1448 | train/epoch_205/ex d g 1449 | train/epoch_205/ex j j 1450 | train/epoch_205{1.76s} 1451 | train/epoch_206/loss 5.9397 1452 | train/epoch_206/ex iiiiii iiiiii 1453 | train/epoch_206/ex gd db 1454 | train/epoch_206/ex c d 1455 | train/epoch_206/ex e i 1456 | train/epoch_206/ex dddf fffd 1457 | train/epoch_206{1.71s} 1458 | train/epoch_207/loss 5.6915 1459 | train/epoch_207/ex agag ggag 1460 | train/epoch_207/ex fff fff 1461 | train/epoch_207/ex ccc ccc 1462 | train/epoch_207/ex b d 1463 | train/epoch_207/ex iiiiiiiiii iiiiiiiiii 1464 | train/epoch_207{1.68s} 1465 | train/epoch_208/loss 6.0428 1466 | train/epoch_208/ex jf fj 1467 | train/epoch_208/ex c c 1468 | train/epoch_208/ex jjjjj jjjjj 1469 | train/epoch_208/ex eb de 1470 | train/epoch_208/ex iiiai iaiii 1471 | train/epoch_208{1.64s} 1472 | train/epoch_209/loss 5.8970 1473 | train/epoch_209/ex ii bb 1474 | train/epoch_209/ex jf ci 1475 | train/epoch_209/ex hi id 1476 | train/epoch_209/ex hhhff hfhhf 1477 | train/epoch_209/ex c d 1478 | train/epoch_209{1.67s} 1479 | train/epoch_210/loss 5.9637 1480 | train/epoch_210/ex eeeeeed dbbedeb 1481 | train/epoch_210/ex iii iii 1482 | train/epoch_210/ex ccccccccg ccggggccg 1483 | train/epoch_210/ex jjjjj jjjjj 1484 | train/epoch_210/ex dd ff 1485 | train/epoch_210{1.71s} 1486 | train/epoch_211/loss 6.3755 1487 | Epoch 211: reducing learning rate of group 0 to 3.9063e-06. 1488 | train/epoch_211/ex a e 1489 | train/epoch_211/ex iiiii iiiii 1490 | train/epoch_211/ex d d 1491 | train/epoch_211/ex bgbgbg bbgbge 1492 | train/epoch_211/ex i i 1493 | train/epoch_211{1.69s} 1494 | train/epoch_212/loss 6.2919 1495 | train/epoch_212/ex aaa haa 1496 | train/epoch_212/ex c i 1497 | train/epoch_212/ex gg gg 1498 | train/epoch_212/ex i i 1499 | train/epoch_212/ex aaaaa aaeaa 1500 | train/epoch_212{1.57s} 1501 | train/epoch_213/loss 5.9976 1502 | train/epoch_213/ex i f 1503 | train/epoch_213/ex hhhhh hhhhh 1504 | train/epoch_213/ex bbi bbi 1505 | train/epoch_213/ex eeee eaaa 1506 | train/epoch_213/ex cc cc 1507 | train/epoch_213{1.65s} 1508 | train/epoch_214/loss 6.1092 1509 | train/epoch_214/ex i i 1510 | train/epoch_214/ex ga jg 1511 | train/epoch_214/ex i f 1512 | train/epoch_214/ex e a 1513 | train/epoch_214/ex hhhhhh hhiihh 1514 | train/epoch_214{1.66s} 1515 | train/epoch_215/loss 6.0899 1516 | train/epoch_215/ex ddd ddd 1517 | train/epoch_215/ex b d 1518 | train/epoch_215/ex hhhhh hhhhh 1519 | train/epoch_215/ex ggggg egggg 1520 | train/epoch_215/ex cjcjcj acfjjf 1521 | train/epoch_215{1.64s} 1522 | train/epoch_216/loss 5.9925 1523 | train/epoch_216/ex ddd ddd 1524 | train/epoch_216/ex ffffhf hhfhhf 1525 | train/epoch_216/ex ia ia 1526 | train/epoch_216/ex da db 1527 | train/epoch_216/ex hhh jjj 1528 | train/epoch_216{1.71s} 1529 | train/epoch_217/loss 6.0272 1530 | train/epoch_217/ex fifi fifi 1531 | train/epoch_217/ex ge ge 1532 | train/epoch_217/ex iib jbb 1533 | train/epoch_217/ex jd if 1534 | train/epoch_217/ex acacac caccca 1535 | train/epoch_217{1.73s} 1536 | train/epoch_218/loss 5.8920 1537 | train/epoch_218/ex ififi ififi 1538 | train/epoch_218/ex c j 1539 | train/epoch_218/ex gg gg 1540 | train/epoch_218/ex bbbbb bbbbb 1541 | train/epoch_218/ex j j 1542 | train/epoch_218{1.71s} 1543 | train/epoch_219/loss 5.9707 1544 | train/epoch_219/ex ff jj 1545 | train/epoch_219/ex dbdb dbdd 1546 | train/epoch_219/ex ccjjjc eeejcj 1547 | train/epoch_219/ex i i 1548 | train/epoch_219/ex eeeee eeeee 1549 | train/epoch_219{1.61s} 1550 | train/epoch_220/loss 5.8610 1551 | train/epoch_220/ex j j 1552 | train/epoch_220/ex cj cj 1553 | train/epoch_220/ex ffj jjf 1554 | train/epoch_220/ex ggee ggeg 1555 | train/epoch_220/ex ji ji 1556 | train/epoch_220{1.71s} 1557 | train/epoch_221/loss 6.1566 1558 | train/epoch_221/ex ef fe 1559 | train/epoch_221/ex ie bi 1560 | train/epoch_221/ex df fd 1561 | train/epoch_221/ex b d 1562 | train/epoch_221/ex i j 1563 | train/epoch_221{1.69s} 1564 | train/epoch_222/loss 6.2244 1565 | Epoch 222: reducing learning rate of group 0 to 1.9531e-06. 1566 | train/epoch_222/ex gggggg iggggg 1567 | train/epoch_222/ex gggge geegg 1568 | train/epoch_222/ex eee cee 1569 | train/epoch_222/ex cjcj cjce 1570 | train/epoch_222/ex eebeebe ebbbebe 1571 | train/epoch_222{1.61s} 1572 | train/epoch_223/loss 6.3746 1573 | train/epoch_223/ex eec cee 1574 | train/epoch_223/ex eee eee 1575 | train/epoch_223/ex dda aaj 1576 | train/epoch_223/ex i d 1577 | train/epoch_223/ex gfg jfg 1578 | train/epoch_223{1.67s} 1579 | train/epoch_224/loss 5.9124 1580 | train/epoch_224/ex e h 1581 | train/epoch_224/ex eee eee 1582 | train/epoch_224/ex bbc bhb 1583 | train/epoch_224/ex dddd addd 1584 | train/epoch_224/ex hfhf fhhf 1585 | train/epoch_224{1.65s} 1586 | train/epoch_225/loss 6.3971 1587 | train/epoch_225/ex gjgj agaj 1588 | train/epoch_225/ex hhh ddd 1589 | train/epoch_225/ex fig gfi 1590 | train/epoch_225/ex i e 1591 | train/epoch_225/ex d d 1592 | train/epoch_225{1.64s} 1593 | train/epoch_226/loss 6.4814 1594 | train/epoch_226/ex iiii iiii 1595 | train/epoch_226/ex e j 1596 | train/epoch_226/ex fifi hifi 1597 | train/epoch_226/ex ah eh 1598 | train/epoch_226/ex ffcfc chchc 1599 | train/epoch_226{1.63s} 1600 | train/epoch_227/loss 6.2232 1601 | train/epoch_227/ex fjbj fbjh 1602 | train/epoch_227/ex aaaaa aaaaa 1603 | train/epoch_227/ex gjj gee 1604 | train/epoch_227/ex i i 1605 | train/epoch_227/ex iiiiiiiiiii iiiiiiiiiii 1606 | train/epoch_227{1.67s} 1607 | train/epoch_228/loss 6.3387 1608 | train/epoch_228/ex dddd dddd 1609 | train/epoch_228/ex cccc cccc 1610 | train/epoch_228/ex dddd ahhh 1611 | train/epoch_228/ex jgjg jgja 1612 | train/epoch_228/ex bab aba 1613 | train/epoch_228{1.69s} 1614 | train/epoch_229/loss 5.9282 1615 | train/epoch_229/ex iii iii 1616 | train/epoch_229/ex e e 1617 | train/epoch_229/ex ccc cch 1618 | train/epoch_229/ex iieei eeiee 1619 | train/epoch_229/ex ccccc ccccc 1620 | train/epoch_229{1.67s} 1621 | train/epoch_230/loss 6.0003 1622 | train/epoch_230/ex jf cj 1623 | train/epoch_230/ex bb dd 1624 | train/epoch_230/ex ggg ggc 1625 | train/epoch_230/ex aaaaa aaaad 1626 | train/epoch_230/ex c h 1627 | train/epoch_230{1.62s} 1628 | train/epoch_231/loss 6.3400 1629 | train/epoch_231/ex hfh fhe 1630 | train/epoch_231/ex iiiiiii iiiiiii 1631 | train/epoch_231/ex cci hcc 1632 | train/epoch_231/ex iii iii 1633 | train/epoch_231/ex ggg ggg 1634 | train/epoch_231{1.65s} 1635 | train/epoch_232/loss 6.1031 1636 | train/epoch_232/ex iii iii 1637 | train/epoch_232/ex ggggg ggggg 1638 | train/epoch_232/ex i i 1639 | train/epoch_232/ex bffb bbfb 1640 | train/epoch_232/ex dddd hddd 1641 | train/epoch_232{1.61s} 1642 | train/epoch_233/loss 5.8287 1643 | Epoch 233: reducing learning rate of group 0 to 9.7656e-07. 1644 | train/epoch_233/ex ia ai 1645 | train/epoch_233/ex ddddg dddfd 1646 | train/epoch_233/ex jjjd djdj 1647 | train/epoch_233/ex ai bi 1648 | train/epoch_233/ex hh jh 1649 | train/epoch_233{1.71s} 1650 | train/epoch_234/loss 6.2340 1651 | train/epoch_234/ex b b 1652 | train/epoch_234/ex iiii iiii 1653 | train/epoch_234/ex dii idd 1654 | train/epoch_234/ex cccc cccc 1655 | train/epoch_234/ex hhhhh hhhhh 1656 | train/epoch_234{1.73s} 1657 | train/epoch_235/loss 6.3833 1658 | train/epoch_235/ex ddd hhh 1659 | train/epoch_235/ex ddd idd 1660 | train/epoch_235/ex gggg fffg 1661 | train/epoch_235/ex i b 1662 | train/epoch_235/ex dddd dddd 1663 | train/epoch_235{1.68s} 1664 | train/epoch_236/loss 6.1122 1665 | train/epoch_236/ex ddee dded 1666 | train/epoch_236/ex dd dd 1667 | train/epoch_236/ex jg ic 1668 | train/epoch_236/ex fff hff 1669 | train/epoch_236/ex jjjj jjjj 1670 | train/epoch_236{1.66s} 1671 | train/epoch_237/loss 6.5434 1672 | train/epoch_237/ex ig ji 1673 | train/epoch_237/ex cb gc 1674 | train/epoch_237/ex fe ef 1675 | train/epoch_237/ex fjjf ghgg 1676 | train/epoch_237/ex eeee eeee 1677 | train/epoch_237{1.71s} 1678 | train/epoch_238/loss 6.2925 1679 | train/epoch_238/ex eee eee 1680 | train/epoch_238/ex e f 1681 | train/epoch_238/ex ffee feee 1682 | train/epoch_238/ex i j 1683 | train/epoch_238/ex fgf ggf 1684 | train/epoch_238{1.68s} 1685 | train/epoch_239/loss 6.2384 1686 | train/epoch_239/ex j j 1687 | train/epoch_239/ex ii ii 1688 | train/epoch_239/ex bbbbb bbbbb 1689 | train/epoch_239/ex aaf faa 1690 | train/epoch_239/ex eeeeeeee eaeeeeee 1691 | train/epoch_239{1.74s} 1692 | train/epoch_240/loss 6.4463 1693 | train/epoch_240/ex i h 1694 | train/epoch_240/ex ecce eece 1695 | train/epoch_240/ex iei fie 1696 | train/epoch_240/ex fjjjjff fjfjfjj 1697 | train/epoch_240/ex jbj jdb 1698 | train/epoch_240{1.71s} 1699 | train/epoch_241/loss 6.2361 1700 | train/epoch_241/ex aaa ggg 1701 | train/epoch_241/ex dfddf dfddf 1702 | train/epoch_241/ex bb bb 1703 | train/epoch_241/ex bj eb 1704 | train/epoch_241/ex iii iii 1705 | train/epoch_241{1.63s} 1706 | train/epoch_242/loss 6.2986 1707 | train/epoch_242/ex bb bb 1708 | train/epoch_242/ex jjjj ijjj 1709 | train/epoch_242/ex ccccc ccccc 1710 | train/epoch_242/ex jhj jhc 1711 | train/epoch_242/ex jjjj jjjj 1712 | train/epoch_242{1.68s} 1713 | train/epoch_243/loss 5.7629 1714 | train/epoch_243/ex ee ff 1715 | train/epoch_243/ex iiiid idiii 1716 | train/epoch_243/ex hi hf 1717 | train/epoch_243/ex cccc hccc 1718 | train/epoch_243/ex hhhhhhh hhhhhhh 1719 | train/epoch_243{1.73s} 1720 | train/epoch_244/loss 5.8432 1721 | Epoch 244: reducing learning rate of group 0 to 4.8828e-07. 1722 | train/epoch_244/ex aaaaaaa aaaaaaa 1723 | train/epoch_244/ex ae ea 1724 | train/epoch_244/ex bbbbb bbbbb 1725 | train/epoch_244/ex fgg ggi 1726 | train/epoch_244/ex bbbb bbbd 1727 | train/epoch_244{1.66s} 1728 | train/epoch_245/loss 5.7299 1729 | train/epoch_245/ex cacaa jgagg 1730 | train/epoch_245/ex cjc cfj 1731 | train/epoch_245/ex bj gb 1732 | train/epoch_245/ex iie iib 1733 | train/epoch_245/ex hhj hjj 1734 | train/epoch_245{1.69s} 1735 | train/epoch_246/loss 6.3262 1736 | train/epoch_246/ex cccc cccc 1737 | train/epoch_246/ex bbbbj jbbbg 1738 | train/epoch_246/ex jb fj 1739 | train/epoch_246/ex c d 1740 | train/epoch_246/ex d b 1741 | train/epoch_246{1.68s} 1742 | train/epoch_247/loss 5.9745 1743 | train/epoch_247/ex djd jdj 1744 | train/epoch_247/ex hhhh ihhh 1745 | train/epoch_247/ex ggggg ggggg 1746 | train/epoch_247/ex iii iii 1747 | train/epoch_247/ex fd jf 1748 | train/epoch_247{1.69s} 1749 | train/epoch_248/loss 5.5535 1750 | train/epoch_248/ex fff fff 1751 | train/epoch_248/ex ff ff 1752 | train/epoch_248/ex bbg bbg 1753 | train/epoch_248/ex jjf eje 1754 | train/epoch_248/ex ccc ecc 1755 | train/epoch_248{1.71s} 1756 | train/epoch_249/loss 6.6518 1757 | train/epoch_249/ex j b 1758 | train/epoch_249/ex d d 1759 | train/epoch_249/ex ggg igg 1760 | train/epoch_249/ex eeee eeee 1761 | train/epoch_249/ex jjjj jjjg 1762 | train/epoch_249{1.60s} 1763 | train/epoch_250/loss 5.9304 1764 | train/epoch_250/ex e h 1765 | train/epoch_250/ex ihihihih iiihhhhi 1766 | train/epoch_250/ex jjjjjjj ejjjjjj 1767 | train/epoch_250/ex cc hc 1768 | train/epoch_250/ex iiiii iiiii 1769 | train/epoch_250{1.70s} 1770 | train/epoch_251/loss 5.8658 1771 | train/epoch_251/ex aaaaa aaaaa 1772 | train/epoch_251/ex aaa aaa 1773 | train/epoch_251/ex ah ja 1774 | train/epoch_251/ex bbbbb bbbbb 1775 | train/epoch_251/ex adf dfa 1776 | train/epoch_251{1.65s} 1777 | train/epoch_252/loss 5.8809 1778 | train/epoch_252/ex ig cg 1779 | train/epoch_252/ex ac ce 1780 | train/epoch_252/ex e a 1781 | train/epoch_252/ex ggggg hgggg 1782 | train/epoch_252/ex hbh hhg 1783 | train/epoch_252{1.61s} 1784 | train/epoch_253/loss 6.3673 1785 | train/epoch_253/ex ccccc cccch 1786 | train/epoch_253/ex ei ed 1787 | train/epoch_253/ex i i 1788 | train/epoch_253/ex jjjj jjjj 1789 | train/epoch_253/ex bb bb 1790 | train/epoch_253{1.74s} 1791 | train/epoch_254/loss 5.7348 1792 | train/epoch_254/ex hhhhhhhf ffhfhhff 1793 | train/epoch_254/ex gggg gggg 1794 | train/epoch_254/ex ccc ccc 1795 | train/epoch_254/ex fffffff fffffff 1796 | train/epoch_254/ex j a 1797 | train/epoch_254{1.69s} 1798 | train/epoch_255/loss 5.7685 1799 | train/epoch_255/ex j a 1800 | train/epoch_255/ex hfhf hhfh 1801 | train/epoch_255/ex ddd ddd 1802 | train/epoch_255/ex dfddfd dfdgfd 1803 | train/epoch_255/ex ccece eecec 1804 | train/epoch_255{1.64s} 1805 | train/epoch_256/loss 5.9912 1806 | train/epoch_256/ex iiiic iicii 1807 | train/epoch_256/ex cc cc 1808 | train/epoch_256/ex h f 1809 | train/epoch_256/ex ce ce 1810 | train/epoch_256/ex gd hg 1811 | train/epoch_256{1.67s} 1812 | train/epoch_257/loss 5.9945 1813 | train/epoch_257/ex ie ja 1814 | train/epoch_257/ex gd hc 1815 | train/epoch_257/ex cccc cccc 1816 | train/epoch_257/ex bb bb 1817 | train/epoch_257/ex ggggg ggggg 1818 | train/epoch_257{1.69s} 1819 | train/epoch_258/loss 6.1971 1820 | train/epoch_258/ex gg gg 1821 | train/epoch_258/ex b d 1822 | train/epoch_258/ex ddddddddd ddddddddd 1823 | train/epoch_258/ex jjjjjj jjjjjj 1824 | train/epoch_258/ex hh hi 1825 | train/epoch_258{1.65s} 1826 | train/epoch_259/loss 5.8641 1827 | Epoch 259: reducing learning rate of group 0 to 2.4414e-07. 1828 | train/epoch_259/ex ddd ddd 1829 | train/epoch_259/ex iiiiii iiiiid 1830 | train/epoch_259/ex fffff fffff 1831 | train/epoch_259/ex bb gg 1832 | train/epoch_259/ex gg gg 1833 | train/epoch_259{1.70s} 1834 | train/epoch_260/loss 5.9756 1835 | train/epoch_260/ex hhhhhhhhhh hhhhhhhhhh 1836 | train/epoch_260/ex c c 1837 | train/epoch_260/ex fff fff 1838 | train/epoch_260/ex ccc ggg 1839 | train/epoch_260/ex bbbbbbb bbbbbbb 1840 | train/epoch_260{1.71s} 1841 | train/epoch_261/loss 6.1036 1842 | train/epoch_261/ex i d 1843 | train/epoch_261/ex fffff fffff 1844 | train/epoch_261/ex b b 1845 | train/epoch_261/ex fj bf 1846 | train/epoch_261/ex ggg ggg 1847 | train/epoch_261{1.67s} 1848 | train/epoch_262/loss 6.1952 1849 | train/epoch_262/ex fc gc 1850 | train/epoch_262/ex i i 1851 | train/epoch_262/ex iiiee iihee 1852 | train/epoch_262/ex eeeee eeeee 1853 | train/epoch_262/ex ifi ibf 1854 | train/epoch_262{1.65s} 1855 | train/epoch_263/loss 6.0037 1856 | train/epoch_263/ex da dh 1857 | train/epoch_263/ex j i 1858 | train/epoch_263/ex gg gg 1859 | train/epoch_263/ex jcj cjc 1860 | train/epoch_263/ex cdcdddc ccdcccd 1861 | train/epoch_263{1.74s} 1862 | train/epoch_264/loss 6.1218 1863 | train/epoch_264/ex ffifi eiiif 1864 | train/epoch_264/ex aaaaa aaaah 1865 | train/epoch_264/ex fb ef 1866 | train/epoch_264/ex d e 1867 | train/epoch_264/ex e h 1868 | train/epoch_264{1.68s} 1869 | train/epoch_265/loss 6.0748 1870 | train/epoch_265/ex ddf ffh 1871 | train/epoch_265/ex jjjjjj jjjjjj 1872 | train/epoch_265/ex hhh hhh 1873 | train/epoch_265/ex jgjg jgjj 1874 | train/epoch_265/ex i c 1875 | train/epoch_265{1.65s} 1876 | train/epoch_266/loss 6.2830 1877 | train/epoch_266/ex jjjjj jhhhh 1878 | train/epoch_266/ex ccccc cccca 1879 | train/epoch_266/ex ddb ddb 1880 | train/epoch_266/ex hh hh 1881 | train/epoch_266/ex iiie iiig 1882 | train/epoch_266{1.67s} 1883 | train/epoch_267/loss 6.0740 1884 | train/epoch_267/ex aj ca 1885 | train/epoch_267/ex ce gc 1886 | train/epoch_267/ex daad adda 1887 | train/epoch_267/ex bd dh 1888 | train/epoch_267/ex hhhhhh hhhhgh 1889 | train/epoch_267{1.61s} 1890 | train/epoch_268/loss 6.2476 1891 | train/epoch_268/ex j g 1892 | train/epoch_268/ex fd di 1893 | train/epoch_268/ex bbc bbh 1894 | train/epoch_268/ex cccjj dddjd 1895 | train/epoch_268/ex cgc cgc 1896 | train/epoch_268{1.72s} 1897 | train/epoch_269/loss 6.2418 1898 | train/epoch_269/ex ccccc ccccc 1899 | train/epoch_269/ex gggg jggj 1900 | train/epoch_269/ex dc dg 1901 | train/epoch_269/ex ieeie ieeii 1902 | train/epoch_269/ex ccccccc ccccccc 1903 | train/epoch_269{1.72s} 1904 | train/epoch_270/loss 6.2247 1905 | Epoch 270: reducing learning rate of group 0 to 1.2207e-07. 1906 | train/epoch_270/ex ddd ddd 1907 | train/epoch_270/ex hhhhh hhehh 1908 | train/epoch_270/ex ggg ggg 1909 | train/epoch_270/ex fff fff 1910 | train/epoch_270/ex aeea eaea 1911 | train/epoch_270{1.68s} 1912 | train/epoch_271/loss 6.1829 1913 | train/epoch_271/ex i i 1914 | train/epoch_271/ex hhhhhhhh hhhhjhhh 1915 | train/epoch_271/ex faga faeg 1916 | train/epoch_271/ex ddd fff 1917 | train/epoch_271/ex ccccc ccccc 1918 | train/epoch_271{1.68s} 1919 | train/epoch_272/loss 6.0693 1920 | train/epoch_272/ex d d 1921 | train/epoch_272/ex eed ede 1922 | train/epoch_272/ex i b 1923 | train/epoch_272/ex fjjf ijaa 1924 | train/epoch_272/ex ddd ddd 1925 | train/epoch_272{1.71s} 1926 | train/epoch_273/loss 5.9479 1927 | train/epoch_273/ex hhh dhh 1928 | train/epoch_273/ex jjjjjjjj jjjjjjjj 1929 | train/epoch_273/ex ddddddd ddddddd 1930 | train/epoch_273/ex i d 1931 | train/epoch_273/ex bbbb bbbb 1932 | train/epoch_273{1.71s} 1933 | train/epoch_274/loss 6.2712 1934 | train/epoch_274/ex hhh hhh 1935 | train/epoch_274/ex je he 1936 | train/epoch_274/ex c d 1937 | train/epoch_274/ex b b 1938 | train/epoch_274/ex cccc ccca 1939 | train/epoch_274{1.65s} 1940 | train/epoch_275/loss 6.1563 1941 | train/epoch_275/ex d f 1942 | train/epoch_275/ex bbbbb ebbbb 1943 | train/epoch_275/ex aaaa aaaa 1944 | train/epoch_275/ex iic icc 1945 | train/epoch_275/ex caa ajj 1946 | train/epoch_275{1.69s} 1947 | train/epoch_276/loss 5.8761 1948 | train/epoch_276/ex c c 1949 | train/epoch_276/ex bbbbg bbccg 1950 | train/epoch_276/ex cj ce 1951 | train/epoch_276/ex aaaaaaa aaaaaaa 1952 | train/epoch_276/ex c c 1953 | train/epoch_276{1.67s} 1954 | train/epoch_277/loss 6.2020 1955 | train/epoch_277/ex bbbbbb bbdbbb 1956 | train/epoch_277/ex ff ff 1957 | train/epoch_277/ex ga fg 1958 | train/epoch_277/ex ddd ddd 1959 | train/epoch_277/ex ii gg 1960 | train/epoch_277{1.67s} 1961 | train/epoch_278/loss 6.3273 1962 | train/epoch_278/ex bbbb jbbb 1963 | train/epoch_278/ex agg gaa 1964 | train/epoch_278/ex i i 1965 | train/epoch_278/ex edde dedd 1966 | train/epoch_278/ex aaaagga igggiaa 1967 | train/epoch_278{1.65s} 1968 | train/epoch_279/loss 6.0416 1969 | train/epoch_279/ex gh gf 1970 | train/epoch_279/ex hhh hhh 1971 | train/epoch_279/ex cf fc 1972 | train/epoch_279/ex ccccccc cccccch 1973 | train/epoch_279/ex hhhhh hhhhh 1974 | train/epoch_279{1.72s} 1975 | train/epoch_280/loss 6.1316 1976 | train/epoch_280/ex jcjf hcjc 1977 | train/epoch_280/ex ddd aff 1978 | train/epoch_280/ex ddde eddd 1979 | train/epoch_280/ex aha hah 1980 | train/epoch_280/ex ddd bii 1981 | train/epoch_280{1.63s} 1982 | train/epoch_281/loss 6.4975 1983 | Epoch 281: reducing learning rate of group 0 to 6.1035e-08. 1984 | train/epoch_281/ex hhhhh hhhhd 1985 | train/epoch_281/ex ddddd ddddd 1986 | train/epoch_281/ex ffff jfff 1987 | train/epoch_281/ex i b 1988 | train/epoch_281/ex ddd ddd 1989 | train/epoch_281{1.68s} 1990 | train/epoch_282/loss 5.9295 1991 | train/epoch_282/ex b d 1992 | train/epoch_282/ex eeeeeee eeeeeee 1993 | train/epoch_282/ex iii iii 1994 | train/epoch_282/ex ccaca acacc 1995 | train/epoch_282/ex ceb ece 1996 | train/epoch_282{1.61s} 1997 | train/epoch_283/loss 6.3771 1998 | train/epoch_283/ex ddddd ddddd 1999 | train/epoch_283/ex bbbbbb bbbabb 2000 | train/epoch_283/ex ffff ffff 2001 | train/epoch_283/ex iii dii 2002 | train/epoch_283/ex jg gj 2003 | train/epoch_283{1.59s} 2004 | train/epoch_284/loss 6.2439 2005 | train/epoch_284/ex bbb aaa 2006 | train/epoch_284/ex jjjj jjjj 2007 | train/epoch_284/ex ffbbf fbfbb 2008 | train/epoch_284/ex aaaaa caaaa 2009 | train/epoch_284/ex dd cc 2010 | train/epoch_284{1.68s} 2011 | train/epoch_285/loss 5.8718 2012 | train/epoch_285/ex hhh hhh 2013 | train/epoch_285/ex ggggg ggggg 2014 | train/epoch_285/ex cccccccc caaaaccc 2015 | train/epoch_285/ex e i 2016 | train/epoch_285/ex aaa aad 2017 | train/epoch_285{1.65s} 2018 | train/epoch_286/loss 5.9488 2019 | train/epoch_286/ex aiai aiia 2020 | train/epoch_286/ex cccc ccce 2021 | train/epoch_286/ex iii iii 2022 | train/epoch_286/ex eeeee eeeee 2023 | train/epoch_286/ex fff fff 2024 | train/epoch_286{1.69s} 2025 | train/epoch_287/loss 6.1329 2026 | train/epoch_287/ex cccc cccc 2027 | train/epoch_287/ex fd df 2028 | train/epoch_287/ex hi df 2029 | train/epoch_287/ex dbdb bgbg 2030 | train/epoch_287/ex hhh hbb 2031 | train/epoch_287{1.66s} 2032 | train/epoch_288/loss 6.3430 2033 | train/epoch_288/ex jjjj jjjj 2034 | train/epoch_288/ex ffffffffffb bdfbfdffbdf 2035 | train/epoch_288/ex aaaaa daaaa 2036 | train/epoch_288/ex jjj jjj 2037 | train/epoch_288/ex aaa aaa 2038 | train/epoch_288{1.82s} 2039 | train/epoch_289/loss 5.8025 2040 | train/epoch_289/ex eeje bgee 2041 | train/epoch_289/ex cdcddd cdaccc 2042 | train/epoch_289/ex dhd did 2043 | train/epoch_289/ex ccccc ccccc 2044 | train/epoch_289/ex dd dd 2045 | train/epoch_289{1.75s} 2046 | train/epoch_290/loss 6.1609 2047 | train/epoch_290/ex ccccf fcccj 2048 | train/epoch_290/ex jjjj jjjj 2049 | train/epoch_290/ex i c 2050 | train/epoch_290/ex eee eee 2051 | train/epoch_290/ex fj jf 2052 | train/epoch_290{1.65s} 2053 | train/epoch_291/loss 6.2130 2054 | train/epoch_291/ex ggg ggg 2055 | train/epoch_291/ex iic icc 2056 | train/epoch_291/ex ac ca 2057 | train/epoch_291/ex eb eb 2058 | train/epoch_291/ex bbb bbb 2059 | train/epoch_291{1.67s} 2060 | train/epoch_292/loss 5.7293 2061 | Epoch 292: reducing learning rate of group 0 to 3.0518e-08. 2062 | train/epoch_292/ex bbbbi bbiii 2063 | train/epoch_292/ex ahhah haaha 2064 | train/epoch_292/ex aa aa 2065 | train/epoch_292/ex ii ii 2066 | train/epoch_292/ex jjjjjjj jjjjjjj 2067 | train/epoch_292{1.66s} 2068 | train/epoch_293/loss 6.1803 2069 | train/epoch_293/ex iiiiiij ibbbibb 2070 | train/epoch_293/ex jjjjj jjjjj 2071 | train/epoch_293/ex ggggd gdhgg 2072 | train/epoch_293/ex ggggg ggggg 2073 | train/epoch_293/ex iiiii eiiii 2074 | train/epoch_293{1.65s} 2075 | train/epoch_294/loss 6.4848 2076 | train/epoch_294/ex ccc hcc 2077 | train/epoch_294/ex aeeae ieaea 2078 | train/epoch_294/ex ggggjj jhhhjh 2079 | train/epoch_294/ex jjfjf jfjfj 2080 | train/epoch_294/ex ha ab 2081 | train/epoch_294{1.72s} 2082 | train/epoch_295/loss 5.9765 2083 | train/epoch_295/ex jjj iii 2084 | train/epoch_295/ex ggggg gdddd 2085 | train/epoch_295/ex hhh hhh 2086 | train/epoch_295/ex eee eee 2087 | train/epoch_295/ex eeeeeee eeeeeee 2088 | train/epoch_295{1.68s} 2089 | train/epoch_296/loss 6.0851 2090 | train/epoch_296/ex jjj jjj 2091 | train/epoch_296/ex ffe fef 2092 | train/epoch_296/ex cg ac 2093 | train/epoch_296/ex ajjaj aajaj 2094 | train/epoch_296/ex eejj deee 2095 | train/epoch_296{1.61s} 2096 | train/epoch_297/loss 5.8814 2097 | train/epoch_297/ex gigigi giggig 2098 | train/epoch_297/ex cc dc 2099 | train/epoch_297/ex d b 2100 | train/epoch_297/ex hhhhhhh hhhhhhh 2101 | train/epoch_297/ex cccccb bcbccc 2102 | train/epoch_297{1.70s} 2103 | train/epoch_298/loss 5.8316 2104 | train/epoch_298/ex jh jh 2105 | train/epoch_298/ex fffff fffff 2106 | train/epoch_298/ex aj jf 2107 | train/epoch_298/ex eb ec 2108 | train/epoch_298/ex hhhhhhhj hhjjhhhh 2109 | train/epoch_298{1.75s} 2110 | train/epoch_299/loss 6.0841 2111 | train/epoch_299/ex c c 2112 | train/epoch_299/ex cc cc 2113 | train/epoch_299/ex ee ee 2114 | train/epoch_299/ex fi ic 2115 | train/epoch_299/ex aaaa aaaa 2116 | train/epoch_299{1.68s} 2117 | train/epoch_300/loss 6.0746 2118 | train/epoch_300/ex ieie eaei 2119 | train/epoch_300/ex aajj aajj 2120 | train/epoch_300/ex jjjjjj jjhjjj 2121 | train/epoch_300/ex gjg jgj 2122 | train/epoch_300/ex gd gh 2123 | train/epoch_300{1.71s} 2124 | train/epoch_301/loss 6.4497 2125 | train/epoch_301/ex bbbdb gbbdd 2126 | train/epoch_301/ex gggj jjgg 2127 | train/epoch_301/ex bj jb 2128 | train/epoch_301/ex iijjjij jjiiiij 2129 | train/epoch_301/ex ffffe fffef 2130 | train/epoch_301{1.72s} 2131 | train/epoch_302/loss 5.9866 2132 | train/epoch_302/ex jjj jjj 2133 | train/epoch_302/ex ig ei 2134 | train/epoch_302/ex fff dff 2135 | train/epoch_302/ex jdjdj jjadj 2136 | train/epoch_302/ex hb fh 2137 | train/epoch_302{1.67s} 2138 | train/epoch_303/loss 6.1320 2139 | Epoch 303: reducing learning rate of group 0 to 1.5259e-08. 2140 | train/epoch_303/ex ifi jif 2141 | train/epoch_303/ex iii iii 2142 | train/epoch_303/ex ffff fffc 2143 | train/epoch_303/ex aa bb 2144 | train/epoch_303/ex ccccc ccccc 2145 | train/epoch_303{1.70s} 2146 | train/epoch_304/loss 6.0997 2147 | train/epoch_304/ex jjjjjj ijjjjb 2148 | train/epoch_304/ex ffff ffaf 2149 | train/epoch_304/ex hhhh hhhh 2150 | train/epoch_304/ex db di 2151 | train/epoch_304/ex ddd ddd 2152 | train/epoch_304{1.66s} 2153 | train/epoch_305/loss 6.4011 2154 | train/epoch_305/ex hddh hhdh 2155 | train/epoch_305/ex ggg agg 2156 | train/epoch_305/ex iiii iiii 2157 | train/epoch_305/ex i d 2158 | train/epoch_305/ex hhhhhhhhhh hhhhhhhhhh 2159 | train/epoch_305{1.67s} 2160 | train/epoch_306/loss 6.2998 2161 | train/epoch_306/ex iii iii 2162 | train/epoch_306/ex bbbbbb gbgbbb 2163 | train/epoch_306/ex gf dg 2164 | train/epoch_306/ex hffcffcfcfc chefcfchhhf 2165 | train/epoch_306/ex hhhhhhhhhh hhhhhhhhhh 2166 | train/epoch_306{1.62s} 2167 | train/epoch_307/loss 6.2166 2168 | train/epoch_307/ex d b 2169 | train/epoch_307/ex hhhhh hhhhh 2170 | train/epoch_307/ex bgg ggc 2171 | train/epoch_307/ex iii iii 2172 | train/epoch_307/ex bbh abb 2173 | train/epoch_307{1.65s} 2174 | train/epoch_308/loss 6.2850 2175 | train/epoch_308/ex ggggg ggggg 2176 | train/epoch_308/ex d i 2177 | train/epoch_308/ex aaaa afaa 2178 | train/epoch_308/ex jhj cjh 2179 | train/epoch_308/ex ici cic 2180 | train/epoch_308{1.68s} 2181 | train/epoch_309/loss 6.7888 2182 | train/epoch_309/ex jjjjj jjjjg 2183 | train/epoch_309/ex jjj jjb 2184 | train/epoch_309/ex ffffff afffff 2185 | train/epoch_309/ex aaaaaaa aacaaaa 2186 | train/epoch_309/ex cgcg ehcc 2187 | train/epoch_309{1.64s} 2188 | train/epoch_310/loss 6.4260 2189 | train/epoch_310/ex hhh hdd 2190 | train/epoch_310/ex ggggg iiiii 2191 | train/epoch_310/ex eeee eeee 2192 | train/epoch_310/ex aaaaaj jajjjj 2193 | train/epoch_310/ex cda acj 2194 | train/epoch_310{1.60s} 2195 | train/epoch_311/loss 6.2633 2196 | train/epoch_311/ex aaaaa aaaaa 2197 | train/epoch_311/ex jd ej 2198 | train/epoch_311/ex i f 2199 | train/epoch_311/ex di gd 2200 | train/epoch_311/ex ib ib 2201 | train/epoch_311{1.67s} 2202 | train/epoch_312/loss 6.2548 2203 | train/epoch_312/ex jjj jjj 2204 | train/epoch_312/ex ggg aaa 2205 | train/epoch_312/ex ieeie ieiii 2206 | train/epoch_312/ex ii hh 2207 | train/epoch_312/ex cgf cgc 2208 | train/epoch_312{1.68s} 2209 | train/epoch_313/loss 6.0804 2210 | train/epoch_313/ex aaaaa aaaaa 2211 | train/epoch_313/ex dg dc 2212 | train/epoch_313/ex jjjjjjj gggjggj 2213 | train/epoch_313/ex hhhhhh bhhhhh 2214 | train/epoch_313/ex jjjjjbb jbbjjjj 2215 | train/epoch_313{1.68s} 2216 | train/epoch_314/loss 6.0775 2217 | train/epoch_314/ex aaaagg gaagaa 2218 | train/epoch_314/ex dd dd 2219 | train/epoch_314/ex fgf cgg 2220 | train/epoch_314/ex iiiiiiiia baaaiaabb 2221 | train/epoch_314/ex cccccc cccdcc 2222 | train/epoch_314{1.69s} 2223 | train/epoch_315/loss 6.0600 2224 | train/epoch_315/ex iiiiiii iiiiiii 2225 | train/epoch_315/ex cc cc 2226 | train/epoch_315/ex d d 2227 | train/epoch_315/ex ccccc ccccc 2228 | train/epoch_315/ex cb bc 2229 | train/epoch_315{1.69s} 2230 | train/epoch_316/loss 6.1829 2231 | train/epoch_316/ex b h 2232 | train/epoch_316/ex ffff feee 2233 | train/epoch_316/ex ggg ggg 2234 | train/epoch_316/ex bbbbb jbbbb 2235 | train/epoch_316/ex ddeed ejdjj 2236 | train/epoch_316{1.63s} 2237 | train/epoch_317/loss 6.3273 2238 | train/epoch_317/ex hhhhh hhhhh 2239 | train/epoch_317/ex hhhh hhhh 2240 | train/epoch_317/ex aaj jaa 2241 | train/epoch_317/ex hhbbhbb hhhbhhb 2242 | train/epoch_317/ex bbbbbb bbbbgb 2243 | train/epoch_317{1.69s} 2244 | train/epoch_318/loss 6.1831 2245 | train/epoch_318/ex ddd ddd 2246 | train/epoch_318/ex bbbb bbbb 2247 | train/epoch_318/ex ggg ggg 2248 | train/epoch_318/ex ch dc 2249 | train/epoch_318/ex hghgh gghgh 2250 | train/epoch_318{1.65s} 2251 | train/epoch_319/loss 6.2866 2252 | train/epoch_319/ex jjjj jjjj 2253 | train/epoch_319/ex ccjjc cjjcj 2254 | train/epoch_319/ex iii iii 2255 | train/epoch_319/ex dddd bbbd 2256 | train/epoch_319/ex cccc ccce 2257 | train/epoch_319{1.65s} 2258 | train/epoch_320/loss 5.9370 2259 | train/epoch_320/ex bf bc 2260 | train/epoch_320/ex ggg ggf 2261 | train/epoch_320/ex c c 2262 | train/epoch_320/ex affa baaf 2263 | train/epoch_320/ex fh hc 2264 | train/epoch_320{1.60s} 2265 | train/epoch_321/loss 5.9383 2266 | train/epoch_321/ex db db 2267 | train/epoch_321/ex c c 2268 | train/epoch_321/ex hhhhh hhhhh 2269 | train/epoch_321/ex jjjj jjjj 2270 | train/epoch_321/ex iiiii iiiii 2271 | train/epoch_321{1.60s} 2272 | train/epoch_322/loss 5.8068 2273 | train/epoch_322/ex cccc cccc 2274 | train/epoch_322/ex ddff fffd 2275 | train/epoch_322/ex je eg 2276 | train/epoch_322/ex bjjb jbbj 2277 | train/epoch_322/ex aac caa 2278 | train/epoch_322{1.65s} 2279 | train/epoch_323/loss 5.7356 2280 | train/epoch_323/ex ggggg ggggg 2281 | train/epoch_323/ex hhhhh hhhhh 2282 | train/epoch_323/ex jjjjjjjjj jjfjjjjjj 2283 | train/epoch_323/ex ccggcg ggcggc 2284 | train/epoch_323/ex aja jae 2285 | train/epoch_323{1.74s} 2286 | train/epoch_324/loss 6.3608 2287 | train/epoch_324/ex ddd iii 2288 | train/epoch_324/ex ggggg ggggg 2289 | train/epoch_324/ex aaaaaa aaaaaa 2290 | train/epoch_324/ex ffjf jffj 2291 | train/epoch_324/ex jjhjh hhjjh 2292 | train/epoch_324{1.63s} 2293 | train/epoch_325/loss 6.1163 2294 | train/epoch_325/ex eed eed 2295 | train/epoch_325/ex gggg gggc 2296 | train/epoch_325/ex aaaa aaaa 2297 | train/epoch_325/ex g g 2298 | train/epoch_325/ex cccc cccc 2299 | train/epoch_325{1.60s} 2300 | train/epoch_326/loss 6.3196 2301 | train/epoch_326/ex i h 2302 | train/epoch_326/ex jjjjjjj jjjjjjj 2303 | train/epoch_326/ex bbbb bhbb 2304 | train/epoch_326/ex ggggg ggggg 2305 | train/epoch_326/ex ajjaj ajaja 2306 | train/epoch_326{1.69s} 2307 | train/epoch_327/loss 6.0687 2308 | train/epoch_327/ex i e 2309 | train/epoch_327/ex aaa aaa 2310 | train/epoch_327/ex aaaaa aaaaa 2311 | train/epoch_327/ex ggg ggg 2312 | train/epoch_327/ex fffffffffff ffcfffgffff 2313 | train/epoch_327{1.71s} 2314 | train/epoch_328/loss 6.1832 2315 | train/epoch_328/ex c h 2316 | train/epoch_328/ex d h 2317 | train/epoch_328/ex cgj acg 2318 | train/epoch_328/ex d b 2319 | train/epoch_328/ex gggb gcgg 2320 | train/epoch_328{1.66s} 2321 | train/epoch_329/loss 6.2093 2322 | train/epoch_329/ex jjjj fjjj 2323 | train/epoch_329/ex iii iic 2324 | train/epoch_329/ex aaaaa haaaa 2325 | train/epoch_329/ex aaaa aaaa 2326 | train/epoch_329/ex cccca cccaa 2327 | train/epoch_329{1.67s} 2328 | train/epoch_330/loss 5.9111 2329 | train/epoch_330/ex dc da 2330 | train/epoch_330/ex cddbb cbbbd 2331 | train/epoch_330/ex eeeee eeeee 2332 | train/epoch_330/ex d d 2333 | train/epoch_330/ex ei eb 2334 | train/epoch_330{1.68s} 2335 | train/epoch_331/loss 6.3757 2336 | train/epoch_331/ex gggg gggc 2337 | train/epoch_331/ex hhe aee 2338 | train/epoch_331/ex cccc cccc 2339 | train/epoch_331/ex ch ec 2340 | train/epoch_331/ex aj ja 2341 | train/epoch_331{1.70s} 2342 | train/epoch_332/loss 6.0378 2343 | train/epoch_332/ex hhh hhh 2344 | train/epoch_332/ex eee gee 2345 | train/epoch_332/ex ce hc 2346 | train/epoch_332/ex jjjj jjjg 2347 | train/epoch_332/ex ffffffff ffffffff 2348 | train/epoch_332{1.67s} 2349 | train/epoch_333/loss 5.9896 2350 | train/epoch_333/ex iii iid 2351 | train/epoch_333/ex j a 2352 | train/epoch_333/ex ddbbbdd bdddbbb 2353 | train/epoch_333/ex i i 2354 | train/epoch_333/ex fffd fffd 2355 | train/epoch_333{1.70s} 2356 | train/epoch_334/loss 6.1915 2357 | train/epoch_334/ex iiii iiii 2358 | train/epoch_334/ex didid iiidi 2359 | train/epoch_334/ex iiiiiii iiiiiii 2360 | train/epoch_334/ex c c 2361 | train/epoch_334/ex b b 2362 | train/epoch_334{1.63s} 2363 | train/epoch_335/loss 6.1718 2364 | train/epoch_335/ex eeeeei ieeeee 2365 | train/epoch_335/ex a i 2366 | train/epoch_335/ex bbb bbb 2367 | train/epoch_335/ex eeeei beiee 2368 | train/epoch_335/ex ff ff 2369 | train/epoch_335{1.70s} 2370 | train/epoch_336/loss 5.7570 2371 | train/epoch_336/ex fe fe 2372 | train/epoch_336/ex ch bh 2373 | train/epoch_336/ex c c 2374 | train/epoch_336/ex jjjjjj jjjjjj 2375 | train/epoch_336/ex iiiii iiiii 2376 | train/epoch_336{1.67s} 2377 | train/epoch_337/loss 5.8231 2378 | train/epoch_337/ex iii iii 2379 | train/epoch_337/ex ji ji 2380 | train/epoch_337/ex dddddddddj djjdjjjdjj 2381 | train/epoch_337/ex c d 2382 | train/epoch_337/ex cccc cccc 2383 | train/epoch_337{1.66s} 2384 | train/epoch_338/loss 6.2300 2385 | train/epoch_338/ex ab ad 2386 | train/epoch_338/ex b d 2387 | train/epoch_338/ex bbb bba 2388 | train/epoch_338/ex iiii iiii 2389 | train/epoch_338/ex ddd idd 2390 | train/epoch_338{1.67s} 2391 | train/epoch_339/loss 6.4937 2392 | train/epoch_339/ex ge hg 2393 | train/epoch_339/ex aaa aaa 2394 | train/epoch_339/ex iii iii 2395 | train/epoch_339/ex ja ja 2396 | train/epoch_339/ex dde eed 2397 | train/epoch_339{1.66s} 2398 | train/epoch_340/loss 6.3367 2399 | train/epoch_340/ex iiiig igiii 2400 | train/epoch_340/ex cd cd 2401 | train/epoch_340/ex cccc cccc 2402 | train/epoch_340/ex iiii iiic 2403 | train/epoch_340/ex cac ccg 2404 | train/epoch_340{1.71s} 2405 | train/epoch_341/loss 6.2187 2406 | train/epoch_341/ex ddj bdd 2407 | train/epoch_341/ex e h 2408 | train/epoch_341/ex h g 2409 | train/epoch_341/ex eeej eeej 2410 | train/epoch_341/ex fffffb bfbffb 2411 | train/epoch_341{1.71s} 2412 | train/epoch_342/loss 6.1466 2413 | train/epoch_342/ex bbb ebb 2414 | train/epoch_342/ex b a 2415 | train/epoch_342/ex ccg ccj 2416 | train/epoch_342/ex bbb bbb 2417 | train/epoch_342/ex fifi fdid 2418 | train/epoch_342{1.69s} 2419 | train/epoch_343/loss 6.1674 2420 | train/epoch_343/ex ccccc cchcc 2421 | train/epoch_343/ex eee eef 2422 | train/epoch_343/ex d c 2423 | train/epoch_343/ex cb cb 2424 | train/epoch_343/ex gjjg jjgj 2425 | train/epoch_343{1.72s} 2426 | train/epoch_344/loss 5.9071 2427 | train/epoch_344/ex hhha aaah 2428 | train/epoch_344/ex ggg igf 2429 | train/epoch_344/ex ig ia 2430 | train/epoch_344/ex j j 2431 | train/epoch_344/ex aa ja 2432 | train/epoch_344{1.62s} 2433 | train/epoch_345/loss 6.3706 2434 | train/epoch_345/ex iii fii 2435 | train/epoch_345/ex jjjjjjg gggjggj 2436 | train/epoch_345/ex bc bj 2437 | train/epoch_345/ex dgd dgd 2438 | train/epoch_345/ex ccc cgg 2439 | train/epoch_345{1.71s} 2440 | train/epoch_346/loss 6.1455 2441 | train/epoch_346/ex i f 2442 | train/epoch_346/ex dddd dddd 2443 | train/epoch_346/ex d g 2444 | train/epoch_346/ex b i 2445 | train/epoch_346/ex dde eed 2446 | train/epoch_346{1.72s} 2447 | train/epoch_347/loss 6.3149 2448 | train/epoch_347/ex cdcdddc ddddccd 2449 | train/epoch_347/ex d d 2450 | train/epoch_347/ex hhi iid 2451 | train/epoch_347/ex i b 2452 | train/epoch_347/ex ddhdh ddcjh 2453 | train/epoch_347{1.70s} 2454 | train/epoch_348/loss 6.0296 2455 | train/epoch_348/ex ggggg ggggg 2456 | train/epoch_348/ex bb bb 2457 | train/epoch_348/ex aaaaa aaaaa 2458 | train/epoch_348/ex hjhj hhjh 2459 | train/epoch_348/ex hhhhh hhhhh 2460 | train/epoch_348{1.70s} 2461 | train/epoch_349/loss 6.9180 2462 | train/epoch_349/ex b b 2463 | train/epoch_349/ex iddidid dididdi 2464 | train/epoch_349/ex fff fff 2465 | train/epoch_349/ex eeeeee eeeeec 2466 | train/epoch_349/ex gdgdgg gdddgd 2467 | train/epoch_349{1.70s} 2468 | train/epoch_350/loss 6.2653 2469 | train/epoch_350/ex cdcd dcdc 2470 | train/epoch_350/ex ff ii 2471 | train/epoch_350/ex ii ii 2472 | train/epoch_350/ex bbbbbf bbbbfb 2473 | train/epoch_350/ex hhhf ffhh 2474 | train/epoch_350{1.60s} 2475 | train/epoch_351/loss 5.7307 2476 | train/epoch_351/ex fjjf jffj 2477 | train/epoch_351/ex iiiiiiiiii iiiiiiiiii 2478 | train/epoch_351/ex ggggg ggggg 2479 | train/epoch_351/ex b b 2480 | train/epoch_351/ex bbb bbb 2481 | train/epoch_351{1.67s} 2482 | train/epoch_352/loss 6.3049 2483 | train/epoch_352/ex i i 2484 | train/epoch_352/ex jj jj 2485 | train/epoch_352/ex dddd dddd 2486 | train/epoch_352/ex e e 2487 | train/epoch_352/ex dd dd 2488 | train/epoch_352{1.77s} 2489 | train/epoch_353/loss 6.0001 2490 | train/epoch_353/ex fffff fffff 2491 | train/epoch_353/ex iii iig 2492 | train/epoch_353/ex hhh hhh 2493 | train/epoch_353/ex chch hchc 2494 | train/epoch_353/ex aaaa aaia 2495 | train/epoch_353{1.75s} 2496 | train/epoch_354/loss 5.6768 2497 | train/epoch_354/ex ccc ccc 2498 | train/epoch_354/ex b h 2499 | train/epoch_354/ex dddd dddd 2500 | train/epoch_354/ex aaaaaaaaa aaaaaaaaa 2501 | train/epoch_354/ex bbggggg biiibgg 2502 | train/epoch_354{1.72s} 2503 | train/epoch_355/loss 5.8546 2504 | train/epoch_355/ex babab baabb 2505 | train/epoch_355/ex i b 2506 | train/epoch_355/ex bbhh hhhb 2507 | train/epoch_355/ex eeeee eieee 2508 | train/epoch_355/ex i g 2509 | train/epoch_355{1.67s} 2510 | train/epoch_356/loss 6.3981 2511 | train/epoch_356/ex eee aee 2512 | train/epoch_356/ex ei bi 2513 | train/epoch_356/ex igg ibg 2514 | train/epoch_356/ex j j 2515 | train/epoch_356/ex ddd ddb 2516 | train/epoch_356{1.68s} 2517 | train/epoch_357/loss 6.2083 2518 | train/epoch_357/ex jjjjjj djjgjj 2519 | train/epoch_357/ex bb eb 2520 | train/epoch_357/ex fff fff 2521 | train/epoch_357/ex cccb cbcc 2522 | train/epoch_357/ex gg cc 2523 | train/epoch_357{1.62s} 2524 | train/epoch_358/loss 6.4533 2525 | train/epoch_358/ex bbf ffi 2526 | train/epoch_358/ex aaaaaaa aaaaaaa 2527 | train/epoch_358/ex jjjg jjgj 2528 | train/epoch_358/ex hj ij 2529 | train/epoch_358/ex aaa aaa 2530 | train/epoch_358{1.64s} 2531 | train/epoch_359/loss 6.2084 2532 | train/epoch_359/ex hhhhh hhhhh 2533 | train/epoch_359/ex i d 2534 | train/epoch_359/ex ji jg 2535 | train/epoch_359/ex fb fe 2536 | train/epoch_359/ex bbb bbb 2537 | train/epoch_359{1.63s} 2538 | train/epoch_360/loss 6.5868 2539 | train/epoch_360/ex aj gj 2540 | train/epoch_360/ex hhaa fhha 2541 | train/epoch_360/ex b d 2542 | train/epoch_360/ex ddd ddd 2543 | train/epoch_360/ex hb jh 2544 | train/epoch_360{1.74s} 2545 | train/epoch_361/loss 6.3684 2546 | train/epoch_361/ex bbbb bbbc 2547 | train/epoch_361/ex hh hf 2548 | train/epoch_361/ex bh hc 2549 | train/epoch_361/ex ffffffffff ffffffffff 2550 | train/epoch_361/ex ffee fffd 2551 | train/epoch_361{1.66s} 2552 | train/epoch_362/loss 6.2143 2553 | train/epoch_362/ex bbbbbb fbbbbb 2554 | train/epoch_362/ex iff iif 2555 | train/epoch_362/ex aaaaaa haahaa 2556 | train/epoch_362/ex eeee eeee 2557 | train/epoch_362/ex hhhhh hhhhh 2558 | train/epoch_362{1.67s} 2559 | train/epoch_363/loss 5.7841 2560 | train/epoch_363/ex ee he 2561 | train/epoch_363/ex jijiji ijjjfi 2562 | train/epoch_363/ex hhh hhh 2563 | train/epoch_363/ex ecjc eeje 2564 | train/epoch_363/ex hhh hhh 2565 | train/epoch_363{1.75s} 2566 | train/epoch_364/loss 6.2260 2567 | train/epoch_364/ex hh ff 2568 | train/epoch_364/ex dc cd 2569 | train/epoch_364/ex hhhhh ddddd 2570 | train/epoch_364/ex aaaaaa aaaaae 2571 | train/epoch_364/ex ggg ggj 2572 | train/epoch_364{1.62s} 2573 | train/epoch_365/loss 6.4527 2574 | train/epoch_365/ex dddd bddd 2575 | train/epoch_365/ex iiii iiii 2576 | train/epoch_365/ex i f 2577 | train/epoch_365/ex j j 2578 | train/epoch_365/ex iiiiiiia fiiiifcc 2579 | train/epoch_365{1.67s} 2580 | train/epoch_366/loss 5.9261 2581 | train/epoch_366/ex bbbbb bbbbb 2582 | train/epoch_366/ex iji hhj 2583 | train/epoch_366/ex gg ii 2584 | train/epoch_366/ex eeee geee 2585 | train/epoch_366/ex bjb bgj 2586 | train/epoch_366{1.67s} 2587 | train/epoch_367/loss 6.0866 2588 | train/epoch_367/ex d d 2589 | train/epoch_367/ex jj bb 2590 | train/epoch_367/ex aaa aaa 2591 | train/epoch_367/ex d h 2592 | train/epoch_367/ex ddg ggd 2593 | train/epoch_367{1.66s} 2594 | train/epoch_368/loss 5.8218 2595 | train/epoch_368/ex cc cc 2596 | train/epoch_368/ex j j 2597 | train/epoch_368/ex h g 2598 | train/epoch_368/ex ffbbb fffbf 2599 | train/epoch_368/ex ge be 2600 | train/epoch_368{1.73s} 2601 | train/epoch_369/loss 6.4046 2602 | train/epoch_369/ex eege eege 2603 | train/epoch_369/ex d b 2604 | train/epoch_369/ex iiiiiii iiiiiia 2605 | train/epoch_369/ex jj jj 2606 | train/epoch_369/ex fa fa 2607 | train/epoch_369{1.72s} 2608 | train/epoch_370/loss 5.9136 2609 | train/epoch_370/ex hhh hhh 2610 | train/epoch_370/ex e e 2611 | train/epoch_370/ex c j 2612 | train/epoch_370/ex jdjdj jjddc 2613 | train/epoch_370/ex i d 2614 | train/epoch_370{1.62s} 2615 | train/epoch_371/loss 6.2363 2616 | train/epoch_371/ex jjd jaj 2617 | train/epoch_371/ex hggh hghh 2618 | train/epoch_371/ex ahah ehef 2619 | train/epoch_371/ex cccch gccch 2620 | train/epoch_371/ex eej ebe 2621 | train/epoch_371{1.59s} 2622 | train/epoch_372/loss 6.3825 2623 | train/epoch_372/ex eea eae 2624 | train/epoch_372/ex ddddd ddddd 2625 | train/epoch_372/ex c d 2626 | train/epoch_372/ex afaaf aaafa 2627 | train/epoch_372/ex fe fd 2628 | train/epoch_372{1.66s} 2629 | train/epoch_373/loss 6.0288 2630 | train/epoch_373/ex ddddddd ddddddd 2631 | train/epoch_373/ex ddddd ddddd 2632 | train/epoch_373/ex j e 2633 | train/epoch_373/ex iiiii iiiii 2634 | train/epoch_373/ex ececeh hchhee 2635 | train/epoch_373{1.74s} 2636 | train/epoch_374/loss 5.7189 2637 | train/epoch_374/ex fff fff 2638 | train/epoch_374/ex e e 2639 | train/epoch_374/ex hhii hihh 2640 | train/epoch_374/ex fa ag 2641 | train/epoch_374/ex eeje aehj 2642 | train/epoch_374{1.68s} 2643 | train/epoch_375/loss 6.1286 2644 | train/epoch_375/ex dg ed 2645 | train/epoch_375/ex fj jf 2646 | train/epoch_375/ex fffff fffff 2647 | train/epoch_375/ex bc cb 2648 | train/epoch_375/ex gdgdg dgdgd 2649 | train/epoch_375{1.61s} 2650 | train/epoch_376/loss 5.9586 2651 | train/epoch_376/ex gjgjjgj ajaaaaj 2652 | train/epoch_376/ex bbbbbbb bbccccc 2653 | train/epoch_376/ex i g 2654 | train/epoch_376/ex db db 2655 | train/epoch_376/ex iiig iiig 2656 | train/epoch_376{1.72s} 2657 | train/epoch_377/loss 6.3735 2658 | train/epoch_377/ex gg gg 2659 | train/epoch_377/ex fifi ffif 2660 | train/epoch_377/ex iiic icii 2661 | train/epoch_377/ex iijjij iiijii 2662 | train/epoch_377/ex jjjj jjjj 2663 | train/epoch_377{1.72s} 2664 | train/epoch_378/loss 6.2734 2665 | train/epoch_378/ex ccc ggg 2666 | train/epoch_378/ex cccc cccc 2667 | train/epoch_378/ex ccccc ccccc 2668 | train/epoch_378/ex ggg ggg 2669 | train/epoch_378/ex j e 2670 | train/epoch_378{1.67s} 2671 | train/epoch_379/loss 6.3686 2672 | train/epoch_379/ex g c 2673 | train/epoch_379/ex d a 2674 | train/epoch_379/ex hhh ghh 2675 | train/epoch_379/ex jjjj jjjj 2676 | train/epoch_379/ex ggg ddd 2677 | train/epoch_379{1.68s} 2678 | train/epoch_380/loss 6.1349 2679 | train/epoch_380/ex c j 2680 | train/epoch_380/ex i a 2681 | train/epoch_380/ex hjj hjj 2682 | train/epoch_380/ex ca ca 2683 | train/epoch_380/ex jjjjjjj jjjjjjj 2684 | train/epoch_380{1.69s} 2685 | train/epoch_381/loss 6.3028 2686 | train/epoch_381/ex jjjj jjjj 2687 | train/epoch_381/ex bbbb jbbb 2688 | train/epoch_381/ex hhhhh hhhhh 2689 | train/epoch_381/ex jjdd jdff 2690 | train/epoch_381/ex ddbbd dbbdd 2691 | train/epoch_381{1.66s} 2692 | train/epoch_382/loss 5.8893 2693 | train/epoch_382/ex ddddb ddfdd 2694 | train/epoch_382/ex c d 2695 | train/epoch_382/ex fjb hfj 2696 | train/epoch_382/ex e j 2697 | train/epoch_382/ex e b 2698 | train/epoch_382{1.68s} 2699 | train/epoch_383/loss 6.1314 2700 | train/epoch_383/ex hhh hhh 2701 | train/epoch_383/ex hh hh 2702 | train/epoch_383/ex fffff iffff 2703 | train/epoch_383/ex aaa aaa 2704 | train/epoch_383/ex eei eeg 2705 | train/epoch_383{1.68s} 2706 | train/epoch_384/loss 5.6820 2707 | train/epoch_384/ex i b 2708 | train/epoch_384/ex e j 2709 | train/epoch_384/ex jjj aaa 2710 | train/epoch_384/ex gd jf 2711 | train/epoch_384/ex bj fb 2712 | train/epoch_384{1.72s} 2713 | train/epoch_385/loss 6.1967 2714 | train/epoch_385/ex d f 2715 | train/epoch_385/ex bbg gaa 2716 | train/epoch_385/ex gggg gggg 2717 | train/epoch_385/ex ghghgh gghhgh 2718 | train/epoch_385/ex c c 2719 | train/epoch_385{1.64s} 2720 | train/epoch_386/loss 5.9736 2721 | train/epoch_386/ex iiiii iiiii 2722 | train/epoch_386/ex jjjjjjj jjjjjjj 2723 | train/epoch_386/ex jj jj 2724 | train/epoch_386/ex aa aa 2725 | train/epoch_386/ex cdcd fccd 2726 | train/epoch_386{1.68s} 2727 | train/epoch_387/loss 5.7759 2728 | train/epoch_387/ex ccc cci 2729 | train/epoch_387/ex bci eca 2730 | train/epoch_387/ex hhh ghh 2731 | train/epoch_387/ex j j 2732 | train/epoch_387/ex j a 2733 | train/epoch_387{1.66s} 2734 | train/epoch_388/loss 6.4127 2735 | train/epoch_388/ex aab aac 2736 | train/epoch_388/ex bba hff 2737 | train/epoch_388/ex iibiiiii iibiibii 2738 | train/epoch_388/ex hhhhh hhhhh 2739 | train/epoch_388/ex eee eej 2740 | train/epoch_388{1.67s} 2741 | train/epoch_389/loss 6.2089 2742 | train/epoch_389/ex i d 2743 | train/epoch_389/ex bbbbbgggg agggbabbb 2744 | train/epoch_389/ex ccc gcc 2745 | train/epoch_389/ex da da 2746 | train/epoch_389/ex bgbgbg fbbbgb 2747 | train/epoch_389{1.72s} 2748 | train/epoch_390/loss 5.9688 2749 | train/epoch_390/ex dd dd 2750 | train/epoch_390/ex aaaaaaaaaaa iiaaaiaiaia 2751 | train/epoch_390/ex ababa aabaa 2752 | train/epoch_390/ex aaaaaa aaaaff 2753 | train/epoch_390/ex d a 2754 | train/epoch_390{1.72s} 2755 | train/epoch_391/loss 5.9084 2756 | train/epoch_391/ex aaaaj jjjaa 2757 | train/epoch_391/ex jjjjj jjbjj 2758 | train/epoch_391/ex iij iji 2759 | train/epoch_391/ex hjih hhih 2760 | train/epoch_391/ex gg gg 2761 | train/epoch_391{1.69s} 2762 | train/epoch_392/loss 5.7375 2763 | train/epoch_392/ex ccc ccc 2764 | train/epoch_392/ex c g 2765 | train/epoch_392/ex hjhj hijh 2766 | train/epoch_392/ex aaaa aaah 2767 | train/epoch_392/ex aaa aaa 2768 | train/epoch_392{1.65s} 2769 | train/epoch_393/loss 6.4508 2770 | train/epoch_393/ex dde bdb 2771 | train/epoch_393/ex egege geege 2772 | train/epoch_393/ex eee eee 2773 | train/epoch_393/ex eeee eeee 2774 | train/epoch_393/ex ddddd ddidf 2775 | train/epoch_393{1.67s} 2776 | train/epoch_394/loss 6.1535 2777 | train/epoch_394/ex ccccccc ccccccc 2778 | train/epoch_394/ex ddj did 2779 | train/epoch_394/ex eee eee 2780 | train/epoch_394/ex igig ejii 2781 | train/epoch_394/ex jjhhhj hhjhhj 2782 | train/epoch_394{1.72s} 2783 | train/epoch_395/loss 6.4586 2784 | train/epoch_395/ex aaaa aaah 2785 | train/epoch_395/ex jjjjjbb bbgjjjb 2786 | train/epoch_395/ex gggg gggg 2787 | train/epoch_395/ex ffbbbb ffbfff 2788 | train/epoch_395/ex j c 2789 | train/epoch_395{1.68s} 2790 | train/epoch_396/loss 5.9828 2791 | train/epoch_396/ex d i 2792 | train/epoch_396/ex bbb bbb 2793 | train/epoch_396/ex eg ae 2794 | train/epoch_396/ex d g 2795 | train/epoch_396/ex b h 2796 | train/epoch_396{1.68s} 2797 | train/epoch_397/loss 6.5899 2798 | train/epoch_397/ex hhh hhh 2799 | train/epoch_397/ex ji hi 2800 | train/epoch_397/ex jjfjf ijiji 2801 | train/epoch_397/ex bg hg 2802 | train/epoch_397/ex fff fff 2803 | train/epoch_397{1.68s} 2804 | train/epoch_398/loss 6.1268 2805 | train/epoch_398/ex bbbh bbhb 2806 | train/epoch_398/ex dddd dddd 2807 | train/epoch_398/ex bbbd dbdb 2808 | train/epoch_398/ex cccc cccc 2809 | train/epoch_398/ex iii iii 2810 | train/epoch_398{1.65s} 2811 | train/epoch_399/loss 5.7406 2812 | train/epoch_399/ex ff gg 2813 | train/epoch_399/ex gbc eeg 2814 | train/epoch_399/ex cc cc 2815 | train/epoch_399/ex bbbbb hbbbb 2816 | train/epoch_399/ex jej jij 2817 | train/epoch_399{1.65s} 2818 | train/epoch_400/loss 6.2328 2819 | train/epoch_400/ex iiiiii iiiiii 2820 | train/epoch_400/ex aaa gaa 2821 | train/epoch_400/ex j j 2822 | train/epoch_400/ex gjjg gehh 2823 | train/epoch_400/ex eeeee geeee 2824 | train/epoch_400{1.70s} 2825 | train/epoch_401/loss 6.0554 2826 | train/epoch_401/ex eeeeeeee aeeeeeee 2827 | train/epoch_401/ex iiii iiii 2828 | train/epoch_401/ex eeeee eeeee 2829 | train/epoch_401/ex c b 2830 | train/epoch_401/ex fa ed 2831 | train/epoch_401{1.62s} 2832 | train/epoch_402/loss 6.2234 2833 | train/epoch_402/ex aaj jaa 2834 | train/epoch_402/ex he ah 2835 | train/epoch_402/ex bddbf bdbbd 2836 | train/epoch_402/ex eeeeeee eeeeeee 2837 | train/epoch_402/ex gg cc 2838 | train/epoch_402{1.65s} 2839 | train/epoch_403/loss 6.1876 2840 | train/epoch_403/ex idid iidi 2841 | train/epoch_403/ex fc cd 2842 | train/epoch_403/ex hee fee 2843 | train/epoch_403/ex jjjjj jjjjb 2844 | train/epoch_403/ex bbbj cjcc 2845 | train/epoch_403{1.66s} 2846 | train/epoch_404/loss 6.3013 2847 | train/epoch_404/ex cccd ccjj 2848 | train/epoch_404/ex ggg fff 2849 | train/epoch_404/ex bjjb bjbj 2850 | train/epoch_404/ex aaaaaaa aaaaaaa 2851 | train/epoch_404/ex cjcjc gjdcj 2852 | train/epoch_404{1.65s} 2853 | train/epoch_405/loss 6.0273 2854 | train/epoch_405/ex c d 2855 | train/epoch_405/ex j j 2856 | train/epoch_405/ex aaa aaa 2857 | train/epoch_405/ex ddddb dbddb 2858 | train/epoch_405/ex ahah haah 2859 | train/epoch_405{1.66s} 2860 | train/epoch_406/loss 6.3622 2861 | train/epoch_406/ex e c 2862 | train/epoch_406/ex bbbbb bbbbe 2863 | train/epoch_406/ex ggggggggg ggggggggg 2864 | train/epoch_406/ex adaaab baddba 2865 | train/epoch_406/ex hhjj hjjh 2866 | train/epoch_406{1.65s} 2867 | train/epoch_407/loss 6.1803 2868 | train/epoch_407/ex ffff ffff 2869 | train/epoch_407/ex gggg fggg 2870 | train/epoch_407/ex ddd ddd 2871 | train/epoch_407/ex dffd fdff 2872 | train/epoch_407/ex cc cb 2873 | train/epoch_407{1.71s} 2874 | train/epoch_408/loss 6.0481 2875 | train/epoch_408/ex ffff ffff 2876 | train/epoch_408/ex jhj jhj 2877 | train/epoch_408/ex deedde edjdjj 2878 | train/epoch_408/ex gdgada ddgagd 2879 | train/epoch_408/ex eej eej 2880 | train/epoch_408{1.63s} 2881 | train/epoch_409/loss 6.1948 2882 | train/epoch_409/ex ea eb 2883 | train/epoch_409/ex fff fff 2884 | train/epoch_409/ex hhh hhj 2885 | train/epoch_409/ex aaf faa 2886 | train/epoch_409/ex ii ii 2887 | train/epoch_409{1.66s} 2888 | train/epoch_410/loss 6.0313 2889 | train/epoch_410/ex dd dd 2890 | train/epoch_410/ex j e 2891 | train/epoch_410/ex aaaaa daaaa 2892 | train/epoch_410/ex aaa gaa 2893 | train/epoch_410/ex ee eh 2894 | train/epoch_410{1.68s} 2895 | train/epoch_411/loss 6.1728 2896 | train/epoch_411/ex b d 2897 | train/epoch_411/ex aaa aaj 2898 | train/epoch_411/ex jjjj ajjj 2899 | train/epoch_411/ex iii iii 2900 | train/epoch_411/ex aaaa aaah 2901 | train/epoch_411{1.71s} 2902 | train/epoch_412/loss 5.8488 2903 | train/epoch_412/ex jjj jjj 2904 | train/epoch_412/ex d c 2905 | train/epoch_412/ex ddd ddd 2906 | train/epoch_412/ex eee eea 2907 | train/epoch_412/ex ffffff ffffff 2908 | train/epoch_412{1.58s} 2909 | train/epoch_413/loss 6.4548 2910 | train/epoch_413/ex j c 2911 | train/epoch_413/ex cjj jcc 2912 | train/epoch_413/ex ggggg ggggg 2913 | train/epoch_413/ex iiiih hihii 2914 | train/epoch_413/ex d d 2915 | train/epoch_413{1.65s} 2916 | train/epoch_414/loss 5.9420 2917 | train/epoch_414/ex iiii iiii 2918 | train/epoch_414/ex cjcj jcjc 2919 | train/epoch_414/ex ccccc cccgc 2920 | train/epoch_414/ex iiii iiih 2921 | train/epoch_414/ex c d 2922 | train/epoch_414{1.71s} 2923 | train/epoch_415/loss 6.2099 2924 | train/epoch_415/ex ddddddd ddddddd 2925 | train/epoch_415/ex hhhjjjh hjhjjjh 2926 | train/epoch_415/ex ee aa 2927 | train/epoch_415/ex efeefe efeffe 2928 | train/epoch_415/ex b b 2929 | train/epoch_415{1.66s} 2930 | train/epoch_416/loss 6.3344 2931 | train/epoch_416/ex jjjj bjjj 2932 | train/epoch_416/ex bb bb 2933 | train/epoch_416/ex d i 2934 | train/epoch_416/ex i i 2935 | train/epoch_416/ex b f 2936 | train/epoch_416{1.73s} 2937 | train/epoch_417/loss 6.5784 2938 | train/epoch_417/ex hch chg 2939 | train/epoch_417/ex ccccc ccccc 2940 | train/epoch_417/ex da ja 2941 | train/epoch_417/ex ededed ddeded 2942 | train/epoch_417/ex ggggg ggggg 2943 | train/epoch_417{1.73s} 2944 | train/epoch_418/loss 6.2283 2945 | train/epoch_418/ex iiiii iiiii 2946 | train/epoch_418/ex i e 2947 | train/epoch_418/ex j a 2948 | train/epoch_418/ex ccc ccc 2949 | train/epoch_418/ex ccch dhhh 2950 | train/epoch_418{1.67s} 2951 | train/epoch_419/loss 5.8940 2952 | train/epoch_419/ex cd dh 2953 | train/epoch_419/ex h d 2954 | train/epoch_419/ex aaa eee 2955 | train/epoch_419/ex cdcdcddc dgdcgdcd 2956 | train/epoch_419/ex bc gb 2957 | train/epoch_419{1.67s} 2958 | train/epoch_420/loss 6.0457 2959 | train/epoch_420/ex aaaa haaa 2960 | train/epoch_420/ex cffcfcc fccccfc 2961 | train/epoch_420/ex bbhhbbbh bbbbhhbh 2962 | train/epoch_420/ex aaaa aaaa 2963 | train/epoch_420/ex hhhhh hhhhh 2964 | train/epoch_420{1.73s} 2965 | train/epoch_421/loss 6.1142 2966 | train/epoch_421/ex chccccccccch chchhhchhhhh 2967 | train/epoch_421/ex jjjj jjjj 2968 | train/epoch_421/ex cc ic 2969 | train/epoch_421/ex ii cc 2970 | train/epoch_421/ex chc cih 2971 | train/epoch_421{1.74s} 2972 | train/epoch_422/loss 6.4450 2973 | train/epoch_422/ex ic cj 2974 | train/epoch_422/ex jfjjf ddjff 2975 | train/epoch_422/ex aaaa aaaa 2976 | train/epoch_422/ex gggg gggg 2977 | train/epoch_422/ex dadad ajdjd 2978 | train/epoch_422{1.65s} 2979 | train/epoch_423/loss 5.9950 2980 | train/epoch_423/ex hhhh ahhe 2981 | train/epoch_423/ex bg gb 2982 | train/epoch_423/ex ddddd ddddd 2983 | train/epoch_423/ex ii ii 2984 | train/epoch_423/ex bbbb bbbb 2985 | train/epoch_423{1.70s} 2986 | train/epoch_424/loss 6.0490 2987 | train/epoch_424/ex ig ih 2988 | train/epoch_424/ex i i 2989 | train/epoch_424/ex iih iih 2990 | train/epoch_424/ex ddddddd dgdgdgg 2991 | train/epoch_424/ex fj jf 2992 | train/epoch_424{1.64s} 2993 | train/epoch_425/loss 5.8621 2994 | train/epoch_425/ex j a 2995 | train/epoch_425/ex cdc dcd 2996 | train/epoch_425/ex eeje efgj 2997 | train/epoch_425/ex aaaaaf ffaffa 2998 | train/epoch_425/ex iiii gggb 2999 | train/epoch_425{1.71s} 3000 | train/epoch_426/loss 6.2427 3001 | train/epoch_426/ex e e 3002 | train/epoch_426/ex cc gg 3003 | train/epoch_426/ex ejg geg 3004 | train/epoch_426/ex jjij iffh 3005 | train/epoch_426/ex iih hhf 3006 | train/epoch_426{1.64s} 3007 | train/epoch_427/loss 6.4234 3008 | train/epoch_427/ex b a 3009 | train/epoch_427/ex ggg egg 3010 | train/epoch_427/ex fffff fcfff 3011 | train/epoch_427/ex iiiii iiiii 3012 | train/epoch_427/ex hfh cfh 3013 | train/epoch_427{1.61s} 3014 | train/epoch_428/loss 6.0105 3015 | train/epoch_428/ex b a 3016 | train/epoch_428/ex i i 3017 | train/epoch_428/ex fe ei 3018 | train/epoch_428/ex dddddddddd dddddddddd 3019 | train/epoch_428/ex b b 3020 | train/epoch_428{1.62s} 3021 | train/epoch_429/loss 5.9524 3022 | train/epoch_429/ex hhhhh hhhhh 3023 | train/epoch_429/ex ccccc ccccc 3024 | train/epoch_429/ex hhhhh bbbbb 3025 | train/epoch_429/ex d d 3026 | train/epoch_429/ex ggg ggb 3027 | train/epoch_429{1.70s} 3028 | train/epoch_430/loss 6.5278 3029 | train/epoch_430/ex i h 3030 | train/epoch_430/ex aaa iaa 3031 | train/epoch_430/ex aaj jaa 3032 | train/epoch_430/ex fffi iffd 3033 | train/epoch_430/ex bbbbb bbbeb 3034 | train/epoch_430{1.65s} 3035 | train/epoch_431/loss 6.4249 3036 | train/epoch_431/ex ggg ghh 3037 | train/epoch_431/ex je jh 3038 | train/epoch_431/ex iii jjj 3039 | train/epoch_431/ex fd fd 3040 | train/epoch_431/ex ffff faff 3041 | train/epoch_431{1.69s} 3042 | train/epoch_432/loss 6.0528 3043 | train/epoch_432/ex dd dd 3044 | train/epoch_432/ex cdd ccd 3045 | train/epoch_432/ex gig aig 3046 | train/epoch_432/ex ddd ddd 3047 | train/epoch_432/ex ebeb jbbe 3048 | train/epoch_432{1.67s} 3049 | train/epoch_433/loss 6.2883 3050 | train/epoch_433/ex fffff hhhhh 3051 | train/epoch_433/ex fff fff 3052 | train/epoch_433/ex hihihi hihhih 3053 | train/epoch_433/ex g h 3054 | train/epoch_433/ex jjhj cjjc 3055 | train/epoch_433{1.61s} 3056 | train/epoch_434/loss 6.0974 3057 | train/epoch_434/ex gggj hhgh 3058 | train/epoch_434/ex ib ic 3059 | train/epoch_434/ex fff dff 3060 | train/epoch_434/ex bgb bgc 3061 | train/epoch_434/ex hhh hhh 3062 | train/epoch_434{1.73s} 3063 | train/epoch_435/loss 5.4621 3064 | train/epoch_435/ex eee eee 3065 | train/epoch_435/ex fj gj 3066 | train/epoch_435/ex e j 3067 | train/epoch_435/ex aaa aab 3068 | train/epoch_435/ex jjjj jjjj 3069 | train/epoch_435{1.65s} 3070 | train/epoch_436/loss 5.6770 3071 | train/epoch_436/ex c c 3072 | train/epoch_436/ex ee aa 3073 | train/epoch_436/ex aaag aaga 3074 | train/epoch_436/ex hhhh bhhh 3075 | train/epoch_436/ex iii hii 3076 | train/epoch_436{1.74s} 3077 | train/epoch_437/loss 6.2312 3078 | train/epoch_437/ex eec eec 3079 | train/epoch_437/ex ddd ddd 3080 | train/epoch_437/ex gh gj 3081 | train/epoch_437/ex aaaaa aaaaa 3082 | train/epoch_437/ex jjij fjji 3083 | train/epoch_437{1.65s} 3084 | train/epoch_438/loss 6.1330 3085 | train/epoch_438/ex ggg ggh 3086 | train/epoch_438/ex c c 3087 | train/epoch_438/ex jjd jgj 3088 | train/epoch_438/ex jj jj 3089 | train/epoch_438/ex eeceec cbceec 3090 | train/epoch_438{1.67s} 3091 | train/epoch_439/loss 6.4038 3092 | train/epoch_439/ex jj aj 3093 | train/epoch_439/ex ccccc ccccc 3094 | train/epoch_439/ex be ib 3095 | train/epoch_439/ex egea eefa 3096 | train/epoch_439/ex aaaaa aaaaa 3097 | train/epoch_439{1.65s} 3098 | train/epoch_440/loss 5.8897 3099 | train/epoch_440/ex gggggg gggggg 3100 | train/epoch_440/ex hhhjjj jjhjhh 3101 | train/epoch_440/ex c c 3102 | train/epoch_440/ex cd bf 3103 | train/epoch_440/ex ea de 3104 | train/epoch_440{1.72s} 3105 | train/epoch_441/loss 5.9677 3106 | train/epoch_441/ex ggg ggd 3107 | train/epoch_441/ex bbbbbb bbfbbb 3108 | train/epoch_441/ex aaaaaa aaaaaa 3109 | train/epoch_441/ex c b 3110 | train/epoch_441/ex gg ii 3111 | train/epoch_441{1.59s} 3112 | train/epoch_442/loss 5.5883 3113 | train/epoch_442/ex eea eef 3114 | train/epoch_442/ex iii iii 3115 | train/epoch_442/ex jd jg 3116 | train/epoch_442/ex ccc ccc 3117 | train/epoch_442/ex eeee aeee 3118 | train/epoch_442{1.72s} 3119 | train/epoch_443/loss 6.0468 3120 | train/epoch_443/ex iiiiiiiii iiiiiiiii 3121 | train/epoch_443/ex ddd ddd 3122 | train/epoch_443/ex j c 3123 | train/epoch_443/ex i f 3124 | train/epoch_443/ex fjef ejjf 3125 | train/epoch_443{1.66s} 3126 | train/epoch_444/loss 6.1882 3127 | train/epoch_444/ex hhhhhhh hhhhhhh 3128 | train/epoch_444/ex cccccc cccccc 3129 | train/epoch_444/ex jjjjjjj jjjjjjj 3130 | train/epoch_444/ex bi bi 3131 | train/epoch_444/ex jc jc 3132 | train/epoch_444{1.67s} 3133 | train/epoch_445/loss 6.0480 3134 | train/epoch_445/ex be bd 3135 | train/epoch_445/ex ac ge 3136 | train/epoch_445/ex aaa aaa 3137 | train/epoch_445/ex dddd dddd 3138 | train/epoch_445/ex eee eee 3139 | train/epoch_445{1.71s} 3140 | train/epoch_446/loss 6.5290 3141 | train/epoch_446/ex c g 3142 | train/epoch_446/ex ahhaha aaahah 3143 | train/epoch_446/ex e c 3144 | train/epoch_446/ex ddddd ddddd 3145 | train/epoch_446/ex iiciicic iiiiccic 3146 | train/epoch_446{1.64s} 3147 | train/epoch_447/loss 6.0909 3148 | train/epoch_447/ex jcjc bicj 3149 | train/epoch_447/ex eeeeeei ihhhhii 3150 | train/epoch_447/ex fdg dfc 3151 | train/epoch_447/ex aaa aaa 3152 | train/epoch_447/ex jffjf jjhjf 3153 | train/epoch_447{1.70s} 3154 | train/epoch_448/loss 6.4686 3155 | train/epoch_448/ex jjjj jjjj 3156 | train/epoch_448/ex iji cij 3157 | train/epoch_448/ex aaia aaia 3158 | train/epoch_448/ex fc ca 3159 | train/epoch_448/ex aaae daae 3160 | train/epoch_448{1.69s} 3161 | train/epoch_449/loss 6.1415 3162 | train/epoch_449/ex bbbbj bbbbj 3163 | train/epoch_449/ex fffff fffff 3164 | train/epoch_449/ex iii iii 3165 | train/epoch_449/ex aiaiai iiiaai 3166 | train/epoch_449/ex jfjjf djfff 3167 | train/epoch_449{1.61s} 3168 | train/epoch_450/loss 6.0899 3169 | train/epoch_450/ex jeejee ehehje 3170 | train/epoch_450/ex bbbbb bbbbh 3171 | train/epoch_450/ex bj cb 3172 | train/epoch_450/ex ccaccacc caccacac 3173 | train/epoch_450/ex ddddd ddddd 3174 | train/epoch_450{1.74s} 3175 | train/epoch_451/loss 6.2052 3176 | train/epoch_451/ex cccccccc cccccecc 3177 | train/epoch_451/ex ibiibi ibiiii 3178 | train/epoch_451/ex hhhhhhhhhh hhhhhhhhhh 3179 | train/epoch_451/ex ge gb 3180 | train/epoch_451/ex iia aai 3181 | train/epoch_451{1.68s} 3182 | train/epoch_452/loss 6.4461 3183 | train/epoch_452/ex fff fff 3184 | train/epoch_452/ex hgg hhg 3185 | train/epoch_452/ex iiii iiii 3186 | train/epoch_452/ex ee jj 3187 | train/epoch_452/ex bbggg bgggb 3188 | train/epoch_452{1.65s} 3189 | train/epoch_453/loss 6.0896 3190 | train/epoch_453/ex ehehehe ddehhdh 3191 | train/epoch_453/ex ddd ddd 3192 | train/epoch_453/ex jjjjj jjjjj 3193 | train/epoch_453/ex di bj 3194 | train/epoch_453/ex aaaaaa faaaaa 3195 | train/epoch_453{1.67s} 3196 | train/epoch_454/loss 5.8263 3197 | train/epoch_454/ex e a 3198 | train/epoch_454/ex caccccjc ajajacaa 3199 | train/epoch_454/ex gggg aggg 3200 | train/epoch_454/ex eje jej 3201 | train/epoch_454/ex bbbb bccc 3202 | train/epoch_454{1.74s} 3203 | train/epoch_455/loss 5.9745 3204 | train/epoch_455/ex cccc cccc 3205 | train/epoch_455/ex ab ga 3206 | train/epoch_455/ex aaaaaaaaa aaaaaaaaa 3207 | train/epoch_455/ex hehe eehe 3208 | train/epoch_455/ex eei jee 3209 | train/epoch_455{1.62s} 3210 | train/epoch_456/loss 6.1401 3211 | train/epoch_456/ex eee eee 3212 | train/epoch_456/ex aaa aaa 3213 | train/epoch_456/ex ccccc ccccc 3214 | train/epoch_456/ex ggggg ggggg 3215 | train/epoch_456/ex fch fcf 3216 | train/epoch_456{1.68s} 3217 | train/epoch_457/loss 6.0618 3218 | train/epoch_457/ex e e 3219 | train/epoch_457/ex ffhhhf hhfhhf 3220 | train/epoch_457/ex jjjjj jjjjh 3221 | train/epoch_457/ex gggggf gfgggg 3222 | train/epoch_457/ex jhj jhe 3223 | train/epoch_457{1.65s} 3224 | train/epoch_458/loss 6.3180 3225 | train/epoch_458/ex ha ji 3226 | train/epoch_458/ex d c 3227 | train/epoch_458/ex ca ag 3228 | train/epoch_458/ex j e 3229 | train/epoch_458/ex dj de 3230 | train/epoch_458{1.71s} 3231 | train/epoch_459/loss 5.7988 3232 | train/epoch_459/ex aad aag 3233 | train/epoch_459/ex i i 3234 | train/epoch_459/ex ccc jjj 3235 | train/epoch_459/ex ccc ccc 3236 | train/epoch_459/ex ggg ggd 3237 | train/epoch_459{1.73s} 3238 | train/epoch_460/loss 5.9250 3239 | train/epoch_460/ex ffff ffff 3240 | train/epoch_460/ex ddd ddd 3241 | train/epoch_460/ex hhh hhh 3242 | train/epoch_460/ex dfd idf 3243 | train/epoch_460/ex c c 3244 | train/epoch_460{1.63s} 3245 | train/epoch_461/loss 5.8154 3246 | train/epoch_461/ex aaa afa 3247 | train/epoch_461/ex i i 3248 | train/epoch_461/ex ddd iii 3249 | train/epoch_461/ex gggg gggg 3250 | train/epoch_461/ex ggg ggj 3251 | train/epoch_461{1.60s} 3252 | train/epoch_462/loss 6.4168 3253 | train/epoch_462/ex aaaaa aaaaa 3254 | train/epoch_462/ex dddf eedd 3255 | train/epoch_462/ex ii ii 3256 | train/epoch_462/ex jjj jji 3257 | train/epoch_462/ex bbb bbd 3258 | train/epoch_462{1.66s} 3259 | train/epoch_463/loss 6.2851 3260 | train/epoch_463/ex jjj jjj 3261 | train/epoch_463/ex aaa eee 3262 | train/epoch_463/ex d e 3263 | train/epoch_463/ex ggg ggg 3264 | train/epoch_463/ex eee eee 3265 | train/epoch_463{1.69s} 3266 | train/epoch_464/loss 5.9816 3267 | train/epoch_464/ex aaaa aaha 3268 | train/epoch_464/ex dc dc 3269 | train/epoch_464/ex dada daad 3270 | train/epoch_464/ex jhhhjjh hjhjjhh 3271 | train/epoch_464/ex fhf hfh 3272 | train/epoch_464{1.72s} 3273 | train/epoch_465/loss 5.9140 3274 | train/epoch_465/ex iijjji ijijjj 3275 | train/epoch_465/ex ic jc 3276 | train/epoch_465/ex aag gaa 3277 | train/epoch_465/ex hhh jhh 3278 | train/epoch_465/ex ddd hdd 3279 | train/epoch_465{1.64s} 3280 | train/epoch_466/loss 5.9214 3281 | train/epoch_466/ex c d 3282 | train/epoch_466/ex ggg cgg 3283 | train/epoch_466/ex hhhhd dhdhh 3284 | train/epoch_466/ex hd bh 3285 | train/epoch_466/ex bjbj djbj 3286 | train/epoch_466{1.64s} 3287 | train/epoch_467/loss 6.4123 3288 | train/epoch_467/ex ceaea aegec 3289 | train/epoch_467/ex bbh bhb 3290 | train/epoch_467/ex aaaaaa caaaaa 3291 | train/epoch_467/ex ggg ggg 3292 | train/epoch_467/ex d b 3293 | train/epoch_467{1.75s} 3294 | train/epoch_468/loss 6.0019 3295 | train/epoch_468/ex ei ej 3296 | train/epoch_468/ex dddc cdcd 3297 | train/epoch_468/ex ggdd gdgg 3298 | train/epoch_468/ex fe ef 3299 | train/epoch_468/ex hh hh 3300 | train/epoch_468{1.68s} 3301 | train/epoch_469/loss 6.5598 3302 | train/epoch_469/ex jjjj jjjj 3303 | train/epoch_469/ex ggggg ggggg 3304 | train/epoch_469/ex aga aga 3305 | train/epoch_469/ex bbb bbb 3306 | train/epoch_469/ex hg dh 3307 | train/epoch_469{1.75s} 3308 | train/epoch_470/loss 5.9900 3309 | train/epoch_470/ex hh hh 3310 | train/epoch_470/ex hhj bhh 3311 | train/epoch_470/ex gg aa 3312 | train/epoch_470/ex gd gj 3313 | train/epoch_470/ex ga ia 3314 | train/epoch_470{1.70s} 3315 | train/epoch_471/loss 6.3808 3316 | train/epoch_471/ex ec ic 3317 | train/epoch_471/ex gh ag 3318 | train/epoch_471/ex iiii giii 3319 | train/epoch_471/ex aaag ahaa 3320 | train/epoch_471/ex ffff ffff 3321 | train/epoch_471{1.67s} 3322 | train/epoch_472/loss 6.0119 3323 | train/epoch_472/ex i i 3324 | train/epoch_472/ex aaaa aaaa 3325 | train/epoch_472/ex ggg ggg 3326 | train/epoch_472/ex iiii iiii 3327 | train/epoch_472/ex bbb bbb 3328 | train/epoch_472{1.69s} 3329 | train/epoch_473/loss 6.0915 3330 | train/epoch_473/ex hf hf 3331 | train/epoch_473/ex dd gg 3332 | train/epoch_473/ex aaj aac 3333 | train/epoch_473/ex eegg gbee 3334 | train/epoch_473/ex gc ig 3335 | train/epoch_473{1.63s} 3336 | train/epoch_474/loss 6.1220 3337 | train/epoch_474/ex ccccc ccccc 3338 | train/epoch_474/ex ejejj ejeej 3339 | train/epoch_474/ex d c 3340 | train/epoch_474/ex gg ee 3341 | train/epoch_474/ex d c 3342 | train/epoch_474{1.63s} 3343 | train/epoch_475/loss 5.9406 3344 | train/epoch_475/ex eeeee aeeee 3345 | train/epoch_475/ex aah haa 3346 | train/epoch_475/ex ddddd ddddd 3347 | train/epoch_475/ex j b 3348 | train/epoch_475/ex hhh hhh 3349 | train/epoch_475{1.66s} 3350 | train/epoch_476/loss 5.6717 3351 | train/epoch_476/ex e a 3352 | train/epoch_476/ex jjjjj jdjjj 3353 | train/epoch_476/ex ajjaj eajjj 3354 | train/epoch_476/ex aaaaa aaaaa 3355 | train/epoch_476/ex i i 3356 | train/epoch_476{1.63s} 3357 | train/epoch_477/loss 6.0442 3358 | train/epoch_477/ex eeeee eeeee 3359 | train/epoch_477/ex jjj jjj 3360 | train/epoch_477/ex dddd dddd 3361 | train/epoch_477/ex jjj eee 3362 | train/epoch_477/ex cgccggc gcccggg 3363 | train/epoch_477{1.71s} 3364 | train/epoch_478/loss 5.9641 3365 | train/epoch_478/ex jjjjjjj jjjggjj 3366 | train/epoch_478/ex ff ff 3367 | train/epoch_478/ex hhh bbb 3368 | train/epoch_478/ex ggc gfg 3369 | train/epoch_478/ex aaaaa baaaa 3370 | train/epoch_478{1.71s} 3371 | train/epoch_479/loss 6.0973 3372 | train/epoch_479/ex jf gj 3373 | train/epoch_479/ex aa da 3374 | train/epoch_479/ex eeee geee 3375 | train/epoch_479/ex iii iii 3376 | train/epoch_479/ex aaaj aaaj 3377 | train/epoch_479{1.65s} 3378 | train/epoch_480/loss 6.2255 3379 | train/epoch_480/ex baba babb 3380 | train/epoch_480/ex c e 3381 | train/epoch_480/ex gggge ggeee 3382 | train/epoch_480/ex eb ce 3383 | train/epoch_480/ex bbbgg gbbbb 3384 | train/epoch_480{1.65s} 3385 | train/epoch_481/loss 5.8839 3386 | train/epoch_481/ex iiiiiiiii biiiiiiii 3387 | train/epoch_481/ex ahah ihah 3388 | train/epoch_481/ex j j 3389 | train/epoch_481/ex ccccc ccccc 3390 | train/epoch_481/ex jjcjd jdcjj 3391 | train/epoch_481{1.75s} 3392 | train/epoch_482/loss 5.8425 3393 | train/epoch_482/ex e i 3394 | train/epoch_482/ex aaaa aaaa 3395 | train/epoch_482/ex gggg gggg 3396 | train/epoch_482/ex aaaa eaaa 3397 | train/epoch_482/ex cccc cccc 3398 | train/epoch_482{1.68s} 3399 | train/epoch_483/loss 6.1832 3400 | train/epoch_483/ex jh aj 3401 | train/epoch_483/ex df df 3402 | train/epoch_483/ex aaaaf eaeia 3403 | train/epoch_483/ex jhj jhj 3404 | train/epoch_483/ex gggg ggef 3405 | train/epoch_483{1.68s} 3406 | train/epoch_484/loss 6.2235 3407 | train/epoch_484/ex eeeeee eeeeee 3408 | train/epoch_484/ex fff fff 3409 | train/epoch_484/ex jjjj jjja 3410 | train/epoch_484/ex aa jj 3411 | train/epoch_484/ex dddddd ddbddd 3412 | train/epoch_484{1.71s} 3413 | train/epoch_485/loss 6.2125 3414 | train/epoch_485/ex bbjj gjjb 3415 | train/epoch_485/ex e i 3416 | train/epoch_485/ex jjjj jjjj 3417 | train/epoch_485/ex iii iii 3418 | train/epoch_485/ex jh ji 3419 | train/epoch_485{1.74s} 3420 | train/epoch_486/loss 6.1269 3421 | train/epoch_486/ex aaaa agaa 3422 | train/epoch_486/ex aaaaaaaaaa ijijaajjji 3423 | train/epoch_486/ex ejej jejj 3424 | train/epoch_486/ex aggag agaaa 3425 | train/epoch_486/ex bbbb bbbd 3426 | train/epoch_486{1.63s} 3427 | --------------------------------------------------------------------------------