import os
import sys
with open(sys.argv[0]) as f:
    code = f.read() # read the code of this file ASAP, for logging
import uuid
import time
import copy
from dataclasses import dataclass
from functools import lru_cache
from pathlib import Path

# must be set before torch is imported so the CUDA allocator picks it up
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True"
import torch
torch.empty(1, device="cuda", requires_grad=True).backward() # prevents a bug on some systems
from torch import Tensor, nn
import torch.nn.functional as F
import torch.distributed as dist
# use of FlexAttention contributed by @KoszarskyB
from torch.nn.attention.flex_attention import BlockMask, flex_attention
#torch._inductor.config.coordinate_descent_tuning = True # we have banned this flag for new records because it causes compilation to take 30min

# -----------------------------------------------------------------------------
# Custom operators: FP8 matmul by @YouJiacheng

@torch.library.custom_op("nanogpt::mm", mutates_args=())
def mm_op(x: Tensor, w: Tensor, x_s: float, w_s: float, grad_s: float) -> tuple[Tensor, Tensor, Tensor]:
    """FP8 forward matmul computing ``x @ w.T``.

    ``x`` and ``w`` are divided by ``x_s`` / ``w_s``, cast to float8_e4m3fn and
    multiplied with ``torch._scaled_mm`` (bfloat16 output), passing the same
    scales back in as ``scale_a`` / ``scale_b``. ``grad_s`` is not used here; it
    is part of the signature so ``setup_context`` can stash it for backward.

    Returns:
        ``(out, x_f8, w_f8)`` - the product plus both FP8 operands, which the
        autograd hook saves for the backward op.
    """
    @torch.compile
    def impl(x: Tensor, w: Tensor):
        assert x.is_contiguous() and w.is_contiguous()
        x_f8 = x.div(x_s).to(torch.float8_e4m3fn)
        w_f8 = w.div(w_s).to(torch.float8_e4m3fn)
        out = torch._scaled_mm(
            x_f8,
            w_f8.T,
            out_dtype=torch.bfloat16,
            scale_a=x.new_tensor(x_s, dtype=torch.float32),
            scale_b=x.new_tensor(w_s, dtype=torch.float32),
            use_fast_accum=True,
        )
        return out, x_f8, w_f8

    return impl(x, w)

@mm_op.register_fake
def _(x: Tensor, w: Tensor, *_):
    # shape/dtype-only implementation used when tracing; also checks the op's input contract
    assert x.ndim == w.ndim == 2
    assert x.shape[1] == w.shape[1]
    assert x.device == w.device
    assert x.is_contiguous() and w.is_contiguous()
    return x @ w.T, x.to(torch.float8_e4m3fn), w.to(torch.float8_e4m3fn)

@torch.library.custom_op("nanogpt::mm_backward", mutates_args=())
def mm_backward_op(g: Tensor, x_f8: Tensor, w_f8: Tensor, x_s: float, w_s: float, grad_s: float) -> tuple[Tensor, Tensor]:
    """FP8 backward for ``mm_op``.

    The incoming gradient is divided by ``grad_s`` and cast to float8_e5m2, then
    two ``torch._scaled_mm`` calls produce ``grad_x`` (bfloat16) and ``grad_w``
    (float32) from the FP8 operands saved by the forward op.

    Returns:
        ``(grad_x, grad_w)``.
    """
    @torch.compile
    def impl(grad: Tensor, x_f8: Tensor, w_f8: Tensor):
        assert grad.is_contiguous()
        # despite the "inv" in the names, these tensors hold the scales themselves
        x_inv_s = grad.new_tensor(x_s, dtype=torch.float32)
        w_inv_s = grad.new_tensor(w_s, dtype=torch.float32)
        grad_inv_s = grad.new_tensor(grad_s, dtype=torch.float32)
        grad_f8 = grad.div(grad_s).to(torch.float8_e5m2)
        grad_x = torch._scaled_mm(
            grad_f8,
            w_f8.T.contiguous().T,
            out_dtype=torch.bfloat16,
            scale_a=grad_inv_s,
            scale_b=w_inv_s,
            use_fast_accum=False,
        )
        # faster than grad_f8_t @ x_f8, for (d_out, d_in) == (50304, 768)
        grad_w = torch._scaled_mm(
            x_f8.T.contiguous(),
            grad_f8.T.contiguous().T,
            out_dtype=torch.float32,
            scale_a=x_inv_s,
            scale_b=grad_inv_s,
            use_fast_accum=False,
        ).T
        return grad_x, grad_w

    return impl(g, x_f8, w_f8)

@mm_backward_op.register_fake
def _(g: Tensor, x_f8: Tensor, w_f8: Tensor, *_):
    # shape/dtype-only implementation: grad_x looks like x (bf16), grad_w looks like w (fp32)
    return x_f8.to(torch.bfloat16), w_f8.to(torch.float32)

def backward(ctx, grad_out: Tensor, *_):
    """Autograd backward for ``mm_op``: dispatch to the FP8 backward op.

    Only the gradient of the first output is used; the three float scale
    arguments receive no gradient (``None``).
    """
    x_f8, w_f8 = ctx.saved_tensors
    x_s, w_s, grad_s = ctx.scales
    grad_x, grad_w = torch.ops.nanogpt.mm_backward(
        grad_out, x_f8, w_f8, x_s, w_s, grad_s
    )
    return grad_x, grad_w, None, None, None

def setup_context(ctx: torch.autograd.function.FunctionCtx, inputs, output):
    """Save the FP8 operands and the three scales that ``backward`` needs."""
    *_, x_s, w_s, grad_s = inputs
    _, x_f8, w_f8 = output
    ctx.save_for_backward(x_f8, w_f8)
    ctx.scales = x_s, w_s, grad_s
    ctx.set_materialize_grads(False)

mm_op.register_autograd(backward, setup_context=setup_context)

# -----------------------------------------------------------------------------
# Muon optimizer

@torch.compile
def zeropower_via_newtonschulz5(G: Tensor, steps: int) -> Tensor:
    """
    Newton-Schulz iteration to compute the zeroth power / orthogonalization of G. We opt to use a
    quintic iteration whose coefficients are selected to maximize the slope at zero. For the purpose
    of minimizing steps, it turns out to be empirically effective to keep increasing the slope at
    zero even beyond the point where the iteration no longer converges all the way to one everywhere
    on the interval. This iteration therefore does not produce UV^T but rather something like US'V^T
    where S' is diagonal with S_{ii}' ~ Uniform(0.5, 1.5), which turns out not to hurt model
    performance at all relative to UV^T, where USV^T = G is the SVD.

    NOTE: `steps` is accepted for interface compatibility but is not read by the body; the number of
    iterations is fixed by the length of the coefficient table below (5 entries).
    """
    assert G.ndim >= 2 # batched Muon implementation by @scottjmaddox, and put into practice in the record by @YouJiacheng
    X = G.bfloat16()
    if G.size(-2) > G.size(-1):
        # work on the transpose when there are more rows than columns, so X @ X.mT is the smaller Gram matrix
        X = X.mT

    # Ensure spectral norm is at most 1
    X = X / (X.norm(dim=(-2, -1), keepdim=True) + 1e-7)
    # Perform the NS iterations
    for a, b, c in [
        (4.0848, -6.8946, 2.9270),
        (3.9505, -6.3029, 2.6377),
        (3.7418, -5.5913, 2.3037),
        (2.8769, -3.1427, 1.2046),
        (2.8366, -3.0525, 1.2012),
    ]:
        A = X @ X.mT
        B = b * A + c * A @ A # quintic computation strategy adapted from suggestion by @jxbz, @leloykun, and @YouJiacheng
        X = a * X + B @ X

    if G.size(-2) > G.size(-1):
        X = X.mT
    return X

class Muon(torch.optim.Optimizer):
    """
    Muon - MomentUm Orthogonalized by Newton-schulz

    https://kellerjordan.github.io/posts/muon/

    Muon internally runs standard SGD-momentum, and then performs an orthogonalization post-
    processing step, in which each 2D parameter's update is replaced with the nearest orthogonal
    matrix. To efficiently orthogonalize each update, we use a Newton-Schulz iteration, which has
    the advantage that it can be stably run in bfloat16 on the GPU.

    Some warnings:
    - This optimizer should not be used for the embedding layer, the final fully connected layer,
    or any {0,1}-D parameters; those should all be optimized by a standard method (e.g., AdamW).
    - To use it with 4D convolutional filters, it works well to just flatten their last 3 dimensions.

    Arguments:
        lr: The learning rate used by the internal SGD.
        weight_decay: Decoupled weight decay; each parameter is multiplied by
            (1 - lr * weight_decay) before its update is applied.
        momentum: The momentum used by the internal SGD.
        nesterov: Whether to use Nesterov-style momentum in the internal SGD. (recommended)
        ns_steps: The number of Newton-Schulz iteration steps to use. (Forwarded to
            zeropower_via_newtonschulz5, which currently always runs its fixed 5-entry schedule.)
        rank: Index of this process; selects which parameter of every chunk it orthogonalizes.
        world_size: Number of processes; parameters are processed in chunks of this size.
    """
    def __init__(self, params, lr=0.02, weight_decay=0.01, momentum=0.95, nesterov=True, ns_steps=5, rank=0, world_size=1):
        self.rank = rank
        self.world_size = world_size
        defaults = dict(lr=lr, weight_decay=weight_decay, momentum=momentum, nesterov=nesterov, ns_steps=ns_steps)
        params: list[Tensor] = [*params]
        param_groups = []
        # one param group per distinct element count, so a single (world_size, numel) buffer
        # can receive the all-gathered updates for every parameter in the group
        for size in {p.numel() for p in params}:
            b = torch.empty(world_size, size, dtype=torch.bfloat16, device="cuda")
            group = dict(params=[p for p in params if p.numel() == size],
                         update_buffer=b, update_buffer_views=[b[i] for i in range(world_size)])
            param_groups.append(group)
        super().__init__(param_groups, defaults)

    @torch.no_grad()
    def step(self):
        """Apply one Muon update to every parameter.

        Parameters of a group are walked in chunks of `world_size`. Within a chunk, this rank
        computes the orthogonalized momentum update for the parameter at offset `rank`, and an async
        all_gather collects every rank's update into the group buffer. Applying a chunk's gathered
        updates is deferred until just before the next chunk's all_gather is launched.
        """
        for group in self.param_groups:
            update_buffer: Tensor = group["update_buffer"]
            update_buffer_views: list[Tensor] = group["update_buffer_views"]
            # generate weight updates in distributed fashion
            params: list[Tensor] = group["params"]
            handle = None
            params_world = None
            def update_prev(): # optimized Muon implementation contributed by @YouJiacheng
                # wait for the pending all_gather, then apply weight decay and the gathered updates
                handle.wait()
                for p_world, g_world in zip(params_world, update_buffer_views):
                    p_world.mul_(1 - group["lr"] * group["weight_decay"])
                    # step size is scaled by sqrt(max(1, rows / cols)) of the parameter
                    p_world.add_(g_world.view_as(p_world),
                                 alpha=-group["lr"] * max(1, p_world.size(-2) / p_world.size(-1))**0.5)
            for base_i in range(len(params))[::self.world_size]:
                if base_i + self.rank < len(params):
                    p = params[base_i + self.rank]
                    g = p.grad
                    assert g is not None
                    state = self.state[p]
                    if "momentum_buffer" not in state:
                        state["momentum_buffer"] = torch.zeros_like(g)
                    buf: Tensor = state["momentum_buffer"]
                    buf.lerp_(g, 1 - group["momentum"])
                    g = g.lerp_(buf, group["momentum"]) if group["nesterov"] else buf
                    g = zeropower_via_newtonschulz5(g, steps=group["ns_steps"]).flatten()
                else:
                    # last chunk is short and this rank has no parameter in it: contribute a
                    # placeholder slice so the collective still has an input from every rank
                    g = update_buffer_views[self.rank]
                if base_i > 0:
                    update_prev() # async all_gather instead of sync all_reduce by @YouJiacheng
                handle = dist.all_gather_into_tensor(update_buffer, g, async_op=True)
                params_world = params[base_i : base_i + self.world_size]
            update_prev()

# -----------------------------------------------------------------------------
# PyTorch nn.Module definitions for the model

def norm(x: Tensor):
    """RMS-normalize `x` over its last dimension (no learnable weight)."""
    return F.rms_norm(x, (x.size(-1),))

class CastedLinear(nn.Linear):
    """Bias-free linear layer whose weight is cast to the input dtype, with an optional FP8 path.

    When `use_fp8` is set and the module is in training mode, the matmul goes through the
    `nanogpt::mm` custom op using the scales `x_s`, `w_s` and `grad_s`; otherwise `F.linear` is used.
    """
    def __init__(self, in_features: int, out_features: int, use_fp8: bool = False, x_s: float = 1.0, w_s: float = 1.0, grad_s: float = 1.0):
        super().__init__(in_features, out_features, bias=False)
        self.use_fp8 = use_fp8
        self.x_s = x_s
        self.w_s = w_s
        self.grad_s = grad_s

    def reset_parameters(self) -> None:
        std = 0.5 * (self.in_features ** -0.5) # 0.5 is a bit better than the default 1/sqrt(3)
        bound = (3 ** 0.5) * std
        with torch.no_grad():
            self.weight.uniform_(-bound, bound)

    def forward(self, x: Tensor):
        if self.use_fp8 and self.training:
            # the custom op takes 2D operands: collapse all leading dims, restore them afterwards
            _x = x.flatten(0, -2)
            out: Tensor = torch.ops.nanogpt.mm(_x, self.weight, x_s=self.x_s, w_s=self.w_s, grad_s=self.grad_s)[0]
            return out.reshape(*x.shape[:-1], -1)
        else:
            return F.linear(x, self.weight.type_as(x))

class Rotary(nn.Module):
    """Rotary position embedding with precomputed cos/sin tables for `max_seq_len` positions."""
    def __init__(self, dim: int, max_seq_len: int):
        super().__init__()
        # half-truncate RoPE by @YouJiacheng (w/ base freq tuning)
        angular_freq = (1 / 1024) ** torch.linspace(0, 1, steps=dim//4, dtype=torch.float32)
        # second half of the frequencies is zero, i.e. those channels are left unrotated
        angular_freq = torch.cat([angular_freq, angular_freq.new_zeros(dim//4)])
        t = torch.arange(max_seq_len, dtype=torch.float32)
        theta = torch.einsum("i,j -> ij", t, angular_freq)
        self.cos = nn.Buffer(theta.cos(), persistent=False)
        self.sin = nn.Buffer(theta.sin(), persistent=False)

    def forward(self, x_BTHD: Tensor):
        # sequence length is read from dim -3; it must fit in the precomputed tables
        assert self.cos.size(0) >= x_BTHD.size(-3)
        cos, sin = self.cos[None, :x_BTHD.size(-3), None, :], self.sin[None, :x_BTHD.size(-3), None, :]
        x1, x2 = x_BTHD.to(dtype=torch.float32).chunk(2, dim=-1)
        y1 = x1 * cos + x2 * sin
        y2 = x1 * (-sin) + x2 * cos
        return torch.cat((y1, y2), 3).type_as(x_BTHD)

class CausalSelfAttention(nn.Module):
    """Self-attention via FlexAttention with merged QKV weights, QK-norm, rotary embeddings and
    an optional token value embedding mixed into V."""
    def __init__(self, dim: int, num_heads: int, max_seq_len: int, head_dim=128):
        super().__init__()
        self.num_heads = num_heads
        self.head_dim = head_dim
        hdim = num_heads * head_dim
        std = 0.5 * (dim ** -0.5)
        bound = (3 ** 0.5) * std # improved init scale by @YouJiacheng
        # merged QKV weights: suggested by many, implemented by @fernbear.bsky.social, and further improved by @YouJiacheng
        # https://x.com/hi_tysam/status/1879699187107033311
        self.qkv_w = nn.Parameter(torch.empty(3, hdim, dim).uniform_(-bound, bound))
        self.lambdas = nn.Parameter(torch.tensor([0.5, 0.5]))
        self.rotary = Rotary(head_dim, max_seq_len)
        self.c_proj = CastedLinear(hdim, dim)
        self.c_proj.weight.detach().zero_() # zero init suggested by @Grad62304977
        # scale the attention logits by given constant, instead of the default head_dim**-0.5, by @leloykun
        # inspired by learnable scalars used by @brendanh0gan https://x.com/hi_tysam/status/1879693583898591283
        self.attn_scale = 0.12

    def forward(self, x: Tensor, ve: Tensor | None, block_mask: BlockMask):
        B, T = x.size(0), x.size(1) # batch size, sequence length
        assert B == 1, "Must use batch size = 1 for FlexAttention"
        q, k, v = F.linear(x, self.qkv_w.flatten(end_dim=1).type_as(x)).view(B, T, 3 * self.num_heads, self.head_dim).chunk(3, dim=-2)
        q, k = norm(q), norm(k) # QK norm @Grad62304977
        q, k = self.rotary(q), self.rotary(k)
        if ve is not None:
            v = self.lambdas[0] * v + self.lambdas[1] * ve.view_as(v) # @KoszarskyB & @Grad62304977
        else: # skip mid-layers token value embeddings by @YouJiacheng
            v = self.lambdas[0] * v
        y = flex_attention(q.transpose(1, 2), k.transpose(1, 2), v.transpose(1, 2), block_mask=block_mask, scale=self.attn_scale).transpose(1, 2)
        y = y.contiguous().view(B, T, self.num_heads * self.head_dim) # re-assemble all head outputs side by side
        y = self.c_proj(y)
        return y

class MLP(nn.Module):
    """Feed-forward block: dim -> 4*dim -> dim with a squared-ReLU activation."""
    def __init__(self, dim: int):
        super().__init__()
        hdim = 4 * dim
        self.c_fc = CastedLinear(dim, hdim)
        self.c_proj = CastedLinear(hdim, dim)
        self.c_proj.weight.detach().zero_() # zero init suggested by @Grad62304977

    def forward(self, x: Tensor):
        x = self.c_fc(x)
        x = F.relu(x).square() # https://arxiv.org/abs/2109.08668v2; ~1-2% better than GELU; suggested by @SKYLINEZ007 and @Grad62304977
        x = self.c_proj(x)
        return x

class Block(nn.Module):
    """Transformer block: learned mix of the residual stream with `x0`, then attention and MLP residuals."""
    def __init__(self, dim: int, num_heads: int, max_seq_len: int, layer_idx: int):
        super().__init__()
        # skip attention of blocks.7 (the 8th layer) by @YouJiacheng
        self.attn = CausalSelfAttention(dim, num_heads, max_seq_len) if layer_idx != 7 else None
        self.mlp = MLP(dim)
        self.lambdas = nn.Parameter(torch.tensor([1., 0.]))

    def forward(self, x: Tensor, ve: Tensor | None, x0: Tensor, block_mask: BlockMask):
        x = self.lambdas[0] * x + self.lambdas[1] * x0
        if self.attn is not None:
            x = x + self.attn(norm(x), ve, block_mask)
        x = x + self.mlp(norm(x))
        return x

# -----------------------------------------------------------------------------
# The main model

def next_multiple_of_n(v: float | int, *, n: int):
    """Return the smallest multiple of `n` that is >= `v` (never less than `n` itself)."""
    return next(x for x in range(n, int(v) + 1 + n, n) if x >= v)

class GPT(nn.Module):
    """GPT-style language model with token value embeddings, U-net skip connections and
    long/short sliding-window FlexAttention masks. `forward` returns the cross-entropy loss."""
    def __init__(self, vocab_size: int, num_layers: int, num_heads: int, model_dim: int, max_seq_len: int):
        super().__init__()
        self.embed = nn.Embedding(vocab_size, model_dim)
        # token value embeddings by @KoszarskyB - inspired by @Grad62304977's value residual implementation following https://arxiv.org/abs/2410.17897
        # value embedding code simplification inspired by @ragulpr https://github.com/KellerJordan/modded-nanogpt/pull/78
        self.value_embeds = nn.ModuleList([nn.Embedding(vocab_size, model_dim) for _ in range(3)])
        self.blocks = nn.ModuleList([Block(model_dim, num_heads, max_seq_len, i) for i in range(num_layers)])
        # there are only 50257 unique GPT-2 tokens; we extend to nearest multiple of 128 for efficiency.
        # suggested to me by @Grad62304977. this originates from Karpathy's experiments.
        self.lm_head = CastedLinear(model_dim, next_multiple_of_n(vocab_size, n=128),
                                    use_fp8=True, x_s=0.5, w_s=2**-9, grad_s=2**-19)
        self.lm_head.weight.detach().zero_() # @Grad62304977
        # Add learnable skip connection weights for decoder layers
        assert num_layers % 2 == 0
        self.skip_weights = nn.Parameter(torch.ones(num_layers//2))

    def create_blockmasks(self, input_seq: Tensor, sliding_window_num_blocks: Tensor):
        """Build the (long, short) document-causal sliding-window BlockMasks for `input_seq`.

        The long mask uses a window of `sliding_window_num_blocks` blocks and the short mask half
        of that; blocks are `BLOCK_SIZE` (128) tokens. Token id 50256 starts a new document.
        """
        BLOCK_SIZE = 128
        # running count of token 50256 gives every position a document index
        docs = (input_seq == 50256).cumsum(0)

        def document_causal(b, h, q_idx, kv_idx):
            causal_mask = q_idx >= kv_idx
            document_mask = docs[q_idx] == docs[kv_idx]
            return causal_mask & document_mask

        def dense_to_ordered(dense_blockmask: Tensor):
            # per query block: how many kv blocks are set, and kv block indices with the set ones first
            num_blocks = dense_blockmask.sum(dim=-1, dtype=torch.int32)
            indices = dense_blockmask.argsort(dim=-1, descending=False, stable=True).flip(-1).to(torch.int32)
            return num_blocks[None, None].contiguous(), indices[None, None].contiguous()

        # manual block mask creation by @YouJiacheng
        assert len(input_seq) % BLOCK_SIZE == 0
        NUM_BLOCKS = len(input_seq) // BLOCK_SIZE
        block_idx = torch.arange(NUM_BLOCKS, dtype=torch.int32, device="cuda")
        # "any": some (q, kv) pair in the block pair may be unmasked; "all": every pair is unmasked
        causal_blockmask_any = block_idx[:, None] >= block_idx
        causal_blockmask_all = block_idx[:, None] > block_idx
        docs_low = docs.view(-1, BLOCK_SIZE)[:, 0].contiguous()
        docs_high = docs.view(-1, BLOCK_SIZE)[:, -1].contiguous()
        document_blockmask_any = (docs_low[:, None] <= docs_high) & (docs_high[:, None] >= docs_low)
        document_blockmask_all = (docs_low[:, None] == docs_high) & (docs_high[:, None] == docs_low)
        blockmask_any = causal_blockmask_any & document_blockmask_any
        blockmask_all = causal_blockmask_all & document_blockmask_all
        partial_kv_num_blocks, partial_kv_indices = dense_to_ordered(blockmask_any & ~blockmask_all)
        full_kv_num_blocks, full_kv_indices = dense_to_ordered(blockmask_all)
        def build_bm(window_size_blocks: Tensor) -> BlockMask:
            return BlockMask.from_kv_blocks(
                torch.clamp_max(partial_kv_num_blocks, torch.clamp_min(window_size_blocks - full_kv_num_blocks, 1)),
                partial_kv_indices,
                torch.clamp_max(full_kv_num_blocks, window_size_blocks - 1),
                full_kv_indices,
                BLOCK_SIZE=BLOCK_SIZE,
                mask_mod=document_causal,
            )
        # Long-short SWA block masks by @leloykun & @YouJiacheng, adapted from suggestion by @Grad62304977, following Gemma 2 paper
        return build_bm(sliding_window_num_blocks), build_bm(sliding_window_num_blocks // 2)

    def forward(self, input_seq: Tensor, target_seq: Tensor, sliding_window_num_blocks: Tensor):
        """Return the cross-entropy loss of the model on a 1-D `input_seq` against `target_seq`.

        NOTE: the value-embedding layout (3 + 3 layers) and the 16-entry `block_masks` list are
        hard-coded; the asserts below fail for any other number of blocks.
        """
        assert input_seq.ndim == 1

        ve = [value_embed(input_seq) for value_embed in self.value_embeds]
        # 012 ... 012 structure on token value embeddings by @YouJiacheng, improved on @leloykun's U-net structure
        ve = [ve[0], ve[1], ve[2]] + [None] * (len(self.blocks) - 6) + [ve[0], ve[1], ve[2]]
        assert len(ve) == len(self.blocks)

        long_bm, short_bm = self.create_blockmasks(input_seq, sliding_window_num_blocks)
        block_masks = [long_bm, short_bm, short_bm, short_bm, long_bm, short_bm, short_bm, short_bm,
                       short_bm, short_bm, short_bm, long_bm, short_bm, short_bm, short_bm, long_bm]
        assert len(block_masks) == len(self.blocks)

        x = x0 = norm(self.embed(input_seq)[None]) # use of norm here by @Grad62304977

        # U-net design by @brendanh0gan
        skip_connections = []
        n = len(self.skip_weights)
        for i in range(len(self.blocks)):
            if i >= n:
                # second half: add the matching first-half output (last pushed, first popped)
                x = x + self.skip_weights[i - n] * skip_connections.pop()
            x = self.blocks[i](x, ve[i], x0, block_masks[i])
            if i < n:
                skip_connections.append(x)

        x = norm(x)
        logits = self.lm_head(x)
        # @Grad62304977 added tanh softcapping following Gemma 2 paper, @KoszarskyB reduced it from 30 to 15, @YouJiacheng shifted it by +15 (2*sigmoid(2*x)=tanh(x)+1)
        logits = 30 * torch.sigmoid(logits.float() / 7.5)
        loss = F.cross_entropy(logits.view(-1, logits.size(-1)), target_seq)
        return loss

# -----------------------------------------------------------------------------
# Our own simple Distributed Data Loader

def _load_data_shard(file: Path):
    """Read one token shard: a header of 256 int32 values followed by uint16 tokens.

    Returns the tokens as a pinned-memory uint16 tensor. Asserts on a wrong magic number,
    an unsupported version, or a token count that does not match the header.
    """
    header = torch.from_file(str(file), False, 256, dtype=torch.int32) # header is 256 int32
    assert header[0] == 20240520, "magic number mismatch in the data .bin file"
    assert header[1] == 1, "unsupported version"
    num_tokens = int(header[2]) # number of tokens (claimed)
    with file.open("rb", buffering=0) as f:
        tokens = torch.empty(num_tokens, dtype=torch.uint16, pin_memory=True) # avoid pin_memory copy by @YouJiacheng
        f.seek(256 * 4)
        nbytes = f.readinto(tokens.numpy()) # avoid bytes->array copy by @YouJiacheng
        assert nbytes == 2 * num_tokens, "number of tokens read does not match header"
    return tokens

def distributed_data_generator(filename_pattern: str, batch_size: int, rank : int, world_size : int):
    """Yield `(inputs, targets)` CUDA tensors for this rank, forever, from the matching shards.

    Shards matching `filename_pattern` (relative to the current directory) are read in sorted
    order. Every step consumes `batch_size` tokens across all ranks; this rank takes the slice at
    offset `rank * (batch_size // world_size)`. `targets` is `inputs` shifted by one token.

    Raises:
        RuntimeError: when no shard matches the pattern, or when a new shard is needed and all
            shards have been consumed (single epoch only).
    """
    files = sorted(Path.cwd().glob(filename_pattern))
    assert batch_size % world_size == 0
    local_batch_size = batch_size // world_size
    file_iter = iter(files) # use itertools.cycle(files) instead if you want to do multi-epoch training

    def next_shard() -> Tensor:
        # A bare next() would leak StopIteration out of the generator body, which Python reports
        # as an opaque "generator raised StopIteration" RuntimeError. Keep the exception type but
        # say what actually happened.
        try:
            shard = next(file_iter)
        except StopIteration:
            if not files:
                raise RuntimeError(f"no data shards match {filename_pattern!r} under {Path.cwd()}") from None
            raise RuntimeError(f"ran out of data: all {len(files)} shards matching {filename_pattern!r} were consumed") from None
        return _load_data_shard(shard)

    tokens, pos = next_shard(), 0
    while True:
        # move on to the next shard when the current one cannot supply a full global batch (+1 target token)
        if pos + batch_size + 1 >= len(tokens):
            tokens, pos = next_shard(), 0
        buf = tokens[pos + rank * local_batch_size:][:local_batch_size + 1]
        inputs = buf[:-1].to(device="cuda", dtype=torch.int32, non_blocking=True) # no sync on host side;
        targets = buf[1:].to(device="cuda", dtype=torch.int64, non_blocking=True) # H2D in another stream isn't helpful.
        pos += batch_size
        yield inputs, targets

# -----------------------------------------------------------------------------
# int main

@dataclass
class Hyperparameters:
    # NOTE: the annotations are what make these real dataclass fields; without them
    # @dataclass generates an empty __init__/__repr__ and these are plain class attributes.
    # data
    train_files: str = "data/fineweb10B/fineweb_train_*.bin" # input .bin to train on
    val_files: str = "data/fineweb10B/fineweb_val_*.bin" # input .bin to eval validation loss on
    val_tokens: int = 10485760 # how many tokens of validation data? it's important to keep this fixed for consistent comparisons
    train_seq_len: int = 64*1024 # FlexAttention sequence length
    val_seq_len: int = 4*64*1024 # FlexAttention sequence length for validation
    # optimization
    num_iterations: int = 7050 # number of iterations to run
    cooldown_frac: float = 0.4 # fraction of training spent cooling down the learning rate
    # architecture
    vocab_size: int = 50257
    # evaluation and logging
    val_loss_every: int = 125 # every how many steps to evaluate val loss? 0 for only at the end
    save_checkpoint: bool = False
args = Hyperparameters()

# torchrun sets these env variables
rank = int(os.environ["RANK"])
world_size = int(os.environ["WORLD_SIZE"])
assert world_size == 8 # this code is designed for 8xH100
assert torch.cuda.is_available()
device = torch.device("cuda", int(os.environ["LOCAL_RANK"]))
torch.cuda.set_device(device)
dist.init_process_group(backend="nccl", device_id=device)
dist.barrier()
master_process = (rank == 0) # this process will do logging, checkpointing etc.

# begin logging
logfile = None
if master_process:
    run_id = uuid.uuid4()
    os.makedirs("logs", exist_ok=True)
    logfile = f"logs/{run_id}.txt"
    print(logfile)
def print0(s, console=False):
    """Append `s` to the run's log file (and echo to stdout if `console`); no-op off the master rank."""
    if master_process:
        with open(logfile, "a") as f:
            if console:
                print(s)
            print(s, file=f)

# begin by printing this file (the Python code)
print0(code)
print0("="*100)
# log information about the hardware/software environment this is running on
print0(f"Running Python {sys.version}")
print0(f"Running PyTorch {torch.version.__version__} compiled for CUDA {torch.version.cuda}")
def nvidia_smi():
    """Return the stdout of the `nvidia-smi` command as text."""
    import subprocess  # avoid top level import
    return subprocess.run(["nvidia-smi"], stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True).stdout
print0(nvidia_smi())
print0("="*100)

########################################
#    Construct model and optimizer     #
########################################

model: nn.Module = GPT(vocab_size=args.vocab_size, num_layers=16, num_heads=8, model_dim=1024,
                       max_seq_len=max(args.train_seq_len, args.val_seq_len)).cuda()
for m in model.modules():
    if isinstance(m, nn.Embedding):
        m.bfloat16()
# start every rank from rank 0's parameters
for param in model.parameters():
    dist.broadcast(param.detach(), 0)

# collect the parameters to optimize
hidden_matrix_params = [p for n, p in model.blocks.named_parameters() if p.ndim >= 2 and "embed" not in n]
embed_params = [p for n, p in model.named_parameters() if "embed" in n]
scalar_params = [p for p in model.parameters() if p.ndim < 2]
head_params = [model.lm_head.weight]

# init the optimizer(s)
adam_params = [dict(params=head_params, lr=0.1/1024**0.5), dict(params=embed_params, lr=0.3), dict(params=scalar_params, lr=0.015)]
# small adam epsilon by @YouJiacheng. this is an alternate method of fixing the world_size dependence
# discovered by @fernbear.bsky.social https://x.com/hi_tysam/status/1879692937589875094
optimizer1 = torch.optim.Adam(adam_params, betas=(0.8, 0.95), eps=1e-10, fused=True)
optimizer2 = Muon(hidden_matrix_params, lr=0.025, momentum=0.95, rank=rank, world_size=world_size)
optimizers = [optimizer1, optimizer2]
# remember each group's base lr so the schedule can rescale from it every step
for opt in optimizers:
    for group in opt.param_groups:
        group["initial_lr"] = group["lr"]

# learning rate schedule: stable then decay
def get_lr(step: int):
    """Return the lr multiplier for `step`: 1.0, then a linear ramp towards 0 over the last `cooldown_frac` of training."""
    x = step / args.num_iterations # progress in training
    assert 0 <= x < 1
    if x < 1 - args.cooldown_frac:
        return 1.0
    else:
        return (1 - x) / args.cooldown_frac

# attention window size schedule: linearly increase
@lru_cache(1)
def get_window_size_blocks_helper(window_size: int):
    # cached so the tensor is only rebuilt when the window size actually changes
    return torch.tensor(window_size // 128, dtype=torch.int32, pin_memory=True).cuda(non_blocking=True)
def get_window_size_blocks(step: int):
    """Return the sliding-window size for `step`, in 128-token blocks, as an int32 CUDA tensor."""
    x = step / args.num_iterations # progress in training
    assert 0 <= x <= 1
    # Linearly increase the block-wise sliding window size over training 128 -> 1792
    # increase by @fernbear.bsky.social; block-wise by @YouJiacheng
    window_size = next_multiple_of_n(1728 * x, n=128)
    return get_window_size_blocks_helper(window_size)

model: nn.Module = torch.compile(model, dynamic=False)
########################################
#            Warmup kernels            #
########################################

# Warmup the training kernels, then re-initialize the state so we aren't cheating
warmup_steps = 10
initial_state = dict(model=copy.deepcopy(model.state_dict()),
                     optimizers=[copy.deepcopy(opt.state_dict()) for opt in optimizers]) # save the initial state
for _ in range(warmup_steps):
    # random tokens are enough here: the warmup steps only exist to trigger compilation
    inputs = targets = torch.randint(0, args.vocab_size, size=(args.train_seq_len,), device="cuda")
    model(inputs.to(torch.int32), targets, get_window_size_blocks(0)).backward()
    for param in model.parameters():
        dist.all_reduce(param.grad, op=dist.ReduceOp.AVG)
    for opt in optimizers:
        opt.step()
    model.zero_grad(set_to_none=True)
# undo the effect of the warmup steps on the weights and the optimizer state
model.load_state_dict(initial_state["model"])
for opt, opt_state in zip(optimizers, initial_state["optimizers"]):
    opt.load_state_dict(opt_state)
del initial_state

########################################
#        Training and validation       #
########################################

# one global batch is world_size sequences of train_seq_len tokens (one sequence per rank)
train_loader = distributed_data_generator(args.train_files, world_size * args.train_seq_len, rank, world_size)
training_time_ms = 0
# start the clock
torch.cuda.synchronize()
t0 = time.perf_counter()
# begin training
train_steps = args.num_iterations
# one extra iteration: the final pass only runs validation (and optional checkpointing), then breaks
for step in range(train_steps + 1):
    last_step = (step == train_steps)

    # --------------- VALIDATION SECTION -----------------
    if last_step or (args.val_loss_every > 0 and step % args.val_loss_every == 0):
        # stop the clock
        torch.cuda.synchronize()
        training_time_ms += 1000 * (time.perf_counter() - t0)
        model.eval()
        val_batch_size = world_size * args.val_seq_len
        assert args.val_tokens % val_batch_size == 0
        val_steps = args.val_tokens // val_batch_size
        # a fresh loader every time, so each evaluation reads the same tokens from the start
        val_loader = distributed_data_generator(args.val_files, val_batch_size, rank, world_size)
        val_loss = 0
        with torch.no_grad():
            for _ in range(val_steps):
                inputs, targets = next(val_loader)
                val_loss += model(inputs, targets, get_window_size_blocks(step))
        val_loss /= val_steps
        del val_loader
        # average the per-rank mean losses across ranks
        dist.all_reduce(val_loss, op=dist.ReduceOp.AVG)
        print0(f"step:{step}/{train_steps} val_loss:{val_loss:.4f} train_time:{training_time_ms:.0f}ms step_avg:{training_time_ms/max(step, 1):.2f}ms", console=True)
        model.train()
        # start the clock again
        torch.cuda.synchronize()
        t0 = time.perf_counter()

    if last_step:
        if master_process and args.save_checkpoint:
            log = dict(step=step, code=code, model=model.state_dict(), optimizers=[opt.state_dict() for opt in optimizers])
            os.makedirs(f"logs/{run_id}", exist_ok=True)
            torch.save(log, f"logs/{run_id}/state_step{step:06d}.pt")
        # the last step only has the validation loop, so break to avoid training
        break

    # --------------- TRAINING SECTION -----------------
    inputs, targets = next(train_loader)
    model(inputs, targets, get_window_size_blocks(step)).backward()
    # average gradients across ranks (manual data parallelism; the model is not wrapped in DDP here)
    for param in model.parameters():
        dist.all_reduce(param.grad, op=dist.ReduceOp.AVG)
    # set optimization hyperparameters
    for opt in optimizers:
        for group in opt.param_groups:
            group["lr"] = group["initial_lr"] * get_lr(step)
    for group in optimizer2.param_groups:
        frac = min(step / 300, 1) # momentum warmup for muon
        group["momentum"] = (1 - frac) * 0.85 + frac * 0.95
    # step the optimizers
    for opt in optimizers:
        opt.step()
    # null the gradients
    model.zero_grad(set_to_none=True)
    # logging
    # "approx": no torch.cuda.synchronize() here, so GPU work that is still queued is not counted
    approx_training_time_ms = training_time_ms + 1000 * (time.perf_counter() - t0)
    print0(f"step:{step+1}/{train_steps} train_time:{approx_training_time_ms:.0f}ms step_avg:{approx_training_time_ms/(step + 1):.2f}ms", console=True)

print0(f"peak memory allocated: {torch.cuda.max_memory_allocated() // 1024 // 1024} MiB "
       f"reserved: {torch.cuda.max_memory_reserved() // 1024 // 1024} MiB", console=True)
dist.destroy_process_group()
====================================================================================================
Running Python 3.10.12 (main, Nov 6 2024, 20:22:13) [GCC 11.4.0]
Running PyTorch 2.7.0.dev20250125+cu126 compiled for CUDA 12.6
Wed Feb 19 02:05:59 2025
+-----------------------------------------------------------------------------------------+ | NVIDIA-SMI 550.90.07 Driver Version: 550.90.07 CUDA Version: 12.4 | |-----------------------------------------+------------------------+----------------------+ | GPU Name Persistence-M | Bus-Id Disp.A | Volatile Uncorr. ECC | | Fan Temp Perf Pwr:Usage/Cap | Memory-Usage | GPU-Util Compute M. | | | | MIG M. | |=========================================+========================+======================| | 0 NVIDIA H100 80GB HBM3 On | 00000000:19:00.0 Off | 0 | | N/A 28C P0 109W / 700W | 7714MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 1 NVIDIA H100 80GB HBM3 On | 00000000:3B:00.0 Off | 0 | | N/A 25C P0 108W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 2 NVIDIA H100 80GB HBM3 On | 00000000:4C:00.0 Off | 0 | | N/A 25C P0 107W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 3 NVIDIA H100 80GB HBM3 On | 00000000:5D:00.0 Off | 0 | | N/A 26C P0 109W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 4 NVIDIA H100 80GB HBM3 On | 00000000:9B:00.0 Off | 0 | | N/A 27C P0 110W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 5 NVIDIA H100 80GB HBM3 On | 00000000:BB:00.0 Off | 0 | | N/A 25C P0 105W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ | 6 NVIDIA H100 80GB HBM3 On | 00000000:CB:00.0 Off | 0 | | N/A 27C P0 112W / 700W | 3452MiB / 81559MiB | 0% Default | | | | Disabled | 
+-----------------------------------------+------------------------+----------------------+ | 7 NVIDIA H100 80GB HBM3 On | 00000000:DB:00.0 Off | 0 | | N/A 25C P0 109W / 700W | 3212MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+------------------------+----------------------+ +-----------------------------------------------------------------------------------------+ | Processes: | | GPU GI CI PID Type Process name GPU Memory | | ID ID Usage | |=========================================================================================| +-----------------------------------------------------------------------------------------+ ==================================================================================================== step:0/7050 val_loss:10.8258 train_time:0ms step_avg:0.06ms step:1/7050 train_time:183ms step_avg:182.50ms step:2/7050 train_time:341ms step_avg:170.48ms step:3/7050 train_time:552ms step_avg:183.88ms step:4/7050 train_time:773ms step_avg:193.26ms step:5/7050 train_time:993ms step_avg:198.51ms step:6/7050 train_time:1213ms step_avg:202.13ms step:7/7050 train_time:1438ms step_avg:205.46ms step:8/7050 train_time:1661ms step_avg:207.64ms step:9/7050 train_time:1883ms step_avg:209.23ms step:10/7050 train_time:2104ms step_avg:210.40ms step:11/7050 train_time:2325ms step_avg:211.36ms step:12/7050 train_time:2547ms step_avg:212.25ms step:13/7050 train_time:2770ms step_avg:213.04ms step:14/7050 train_time:2991ms step_avg:213.63ms step:15/7050 train_time:3213ms step_avg:214.23ms step:16/7050 train_time:3437ms step_avg:214.82ms step:17/7050 train_time:3659ms step_avg:215.26ms step:18/7050 train_time:3882ms step_avg:215.64ms step:19/7050 train_time:4103ms step_avg:215.95ms step:20/7050 train_time:4325ms step_avg:216.24ms step:21/7050 train_time:4547ms step_avg:216.50ms step:22/7050 train_time:4769ms step_avg:216.79ms step:23/7050 train_time:4991ms step_avg:216.99ms step:24/7050 train_time:5213ms step_avg:217.22ms 
step:25/7050 train_time:5435ms step_avg:217.40ms step:26/7050 train_time:5658ms step_avg:217.61ms step:27/7050 train_time:5881ms step_avg:217.80ms step:28/7050 train_time:6104ms step_avg:217.99ms step:29/7050 train_time:6326ms step_avg:218.13ms step:30/7050 train_time:6547ms step_avg:218.23ms step:31/7050 train_time:6770ms step_avg:218.38ms step:32/7050 train_time:6992ms step_avg:218.50ms step:33/7050 train_time:7217ms step_avg:218.69ms step:34/7050 train_time:7438ms step_avg:218.76ms step:35/7050 train_time:7659ms step_avg:218.83ms step:36/7050 train_time:7883ms step_avg:218.96ms step:37/7050 train_time:8105ms step_avg:219.04ms step:38/7050 train_time:8327ms step_avg:219.12ms step:39/7050 train_time:8548ms step_avg:219.17ms step:40/7050 train_time:8769ms step_avg:219.23ms step:41/7050 train_time:8992ms step_avg:219.32ms step:42/7050 train_time:9215ms step_avg:219.41ms step:43/7050 train_time:9438ms step_avg:219.49ms step:44/7050 train_time:9661ms step_avg:219.57ms step:45/7050 train_time:9883ms step_avg:219.63ms step:46/7050 train_time:10105ms step_avg:219.67ms step:47/7050 train_time:10326ms step_avg:219.70ms step:48/7050 train_time:10549ms step_avg:219.76ms step:49/7050 train_time:10771ms step_avg:219.82ms step:50/7050 train_time:10994ms step_avg:219.88ms step:51/7050 train_time:11218ms step_avg:219.95ms step:52/7050 train_time:11439ms step_avg:219.97ms step:53/7050 train_time:11660ms step_avg:219.99ms step:54/7050 train_time:11882ms step_avg:220.04ms step:55/7050 train_time:12105ms step_avg:220.09ms step:56/7050 train_time:12327ms step_avg:220.13ms step:57/7050 train_time:12549ms step_avg:220.16ms step:58/7050 train_time:12772ms step_avg:220.20ms step:59/7050 train_time:12994ms step_avg:220.23ms step:60/7050 train_time:13216ms step_avg:220.27ms step:61/7050 train_time:13438ms step_avg:220.30ms step:62/7050 train_time:13660ms step_avg:220.32ms step:63/7050 train_time:13882ms step_avg:220.35ms step:64/7050 train_time:14104ms step_avg:220.38ms step:65/7050 
train_time:14326ms step_avg:220.40ms step:66/7050 train_time:14548ms step_avg:220.42ms step:67/7050 train_time:14770ms step_avg:220.45ms step:68/7050 train_time:14993ms step_avg:220.49ms step:69/7050 train_time:15216ms step_avg:220.52ms step:70/7050 train_time:15437ms step_avg:220.53ms step:71/7050 train_time:15660ms step_avg:220.56ms step:72/7050 train_time:15883ms step_avg:220.60ms step:73/7050 train_time:16105ms step_avg:220.61ms step:74/7050 train_time:16327ms step_avg:220.64ms step:75/7050 train_time:16549ms step_avg:220.66ms step:76/7050 train_time:16771ms step_avg:220.67ms step:77/7050 train_time:16994ms step_avg:220.70ms step:78/7050 train_time:17217ms step_avg:220.73ms step:79/7050 train_time:17438ms step_avg:220.74ms step:80/7050 train_time:17660ms step_avg:220.75ms step:81/7050 train_time:17881ms step_avg:220.75ms step:82/7050 train_time:18104ms step_avg:220.77ms step:83/7050 train_time:18326ms step_avg:220.80ms step:84/7050 train_time:18549ms step_avg:220.82ms step:85/7050 train_time:18770ms step_avg:220.82ms step:86/7050 train_time:18992ms step_avg:220.84ms step:87/7050 train_time:19214ms step_avg:220.86ms step:88/7050 train_time:19437ms step_avg:220.88ms step:89/7050 train_time:19659ms step_avg:220.89ms step:90/7050 train_time:19882ms step_avg:220.91ms step:91/7050 train_time:20104ms step_avg:220.93ms step:92/7050 train_time:20326ms step_avg:220.94ms step:93/7050 train_time:20549ms step_avg:220.95ms step:94/7050 train_time:20771ms step_avg:220.97ms step:95/7050 train_time:20994ms step_avg:220.99ms step:96/7050 train_time:21217ms step_avg:221.02ms step:97/7050 train_time:21439ms step_avg:221.02ms step:98/7050 train_time:21660ms step_avg:221.02ms step:99/7050 train_time:21881ms step_avg:221.02ms step:100/7050 train_time:22104ms step_avg:221.04ms step:101/7050 train_time:22326ms step_avg:221.05ms step:102/7050 train_time:22548ms step_avg:221.06ms step:103/7050 train_time:22770ms step_avg:221.07ms step:104/7050 train_time:22992ms step_avg:221.08ms 
step:105/7050 train_time:23215ms step_avg:221.09ms step:106/7050 train_time:23437ms step_avg:221.10ms step:107/7050 train_time:23659ms step_avg:221.11ms step:108/7050 train_time:23881ms step_avg:221.12ms step:109/7050 train_time:24104ms step_avg:221.14ms step:110/7050 train_time:24326ms step_avg:221.15ms step:111/7050 train_time:24547ms step_avg:221.15ms step:112/7050 train_time:24769ms step_avg:221.15ms step:113/7050 train_time:24990ms step_avg:221.15ms step:114/7050 train_time:25212ms step_avg:221.16ms step:115/7050 train_time:25433ms step_avg:221.16ms step:116/7050 train_time:25655ms step_avg:221.17ms step:117/7050 train_time:25878ms step_avg:221.18ms step:118/7050 train_time:26101ms step_avg:221.20ms step:119/7050 train_time:26324ms step_avg:221.21ms step:120/7050 train_time:26544ms step_avg:221.20ms step:121/7050 train_time:26767ms step_avg:221.22ms step:122/7050 train_time:26988ms step_avg:221.22ms step:123/7050 train_time:27211ms step_avg:221.23ms step:124/7050 train_time:27433ms step_avg:221.24ms step:125/7050 train_time:27654ms step_avg:221.24ms step:125/7050 val_loss:4.5208 train_time:27830ms step_avg:222.64ms step:126/7050 train_time:27877ms step_avg:221.25ms step:127/7050 train_time:28103ms step_avg:221.29ms step:128/7050 train_time:28331ms step_avg:221.33ms step:129/7050 train_time:28555ms step_avg:221.35ms step:130/7050 train_time:28776ms step_avg:221.35ms step:131/7050 train_time:28996ms step_avg:221.34ms step:132/7050 train_time:29219ms step_avg:221.36ms step:133/7050 train_time:29444ms step_avg:221.38ms step:134/7050 train_time:29667ms step_avg:221.39ms step:135/7050 train_time:29887ms step_avg:221.39ms step:136/7050 train_time:30109ms step_avg:221.39ms step:137/7050 train_time:30332ms step_avg:221.40ms step:138/7050 train_time:30556ms step_avg:221.42ms step:139/7050 train_time:30777ms step_avg:221.42ms step:140/7050 train_time:30997ms step_avg:221.41ms step:141/7050 train_time:31219ms step_avg:221.41ms step:142/7050 train_time:31442ms 
step_avg:221.43ms step:143/7050 train_time:31663ms step_avg:221.42ms step:144/7050 train_time:31885ms step_avg:221.42ms step:145/7050 train_time:32108ms step_avg:221.43ms step:146/7050 train_time:32329ms step_avg:221.43ms step:147/7050 train_time:32552ms step_avg:221.44ms step:148/7050 train_time:32774ms step_avg:221.45ms step:149/7050 train_time:32995ms step_avg:221.45ms step:150/7050 train_time:33218ms step_avg:221.45ms step:151/7050 train_time:33439ms step_avg:221.45ms step:152/7050 train_time:33660ms step_avg:221.45ms step:153/7050 train_time:33880ms step_avg:221.44ms step:154/7050 train_time:34101ms step_avg:221.44ms step:155/7050 train_time:34323ms step_avg:221.44ms step:156/7050 train_time:34545ms step_avg:221.44ms step:157/7050 train_time:34767ms step_avg:221.45ms step:158/7050 train_time:34988ms step_avg:221.44ms step:159/7050 train_time:35209ms step_avg:221.44ms step:160/7050 train_time:35431ms step_avg:221.45ms step:161/7050 train_time:35653ms step_avg:221.45ms step:162/7050 train_time:35875ms step_avg:221.45ms step:163/7050 train_time:36098ms step_avg:221.46ms step:164/7050 train_time:36319ms step_avg:221.46ms step:165/7050 train_time:36541ms step_avg:221.46ms step:166/7050 train_time:36763ms step_avg:221.46ms step:167/7050 train_time:36984ms step_avg:221.46ms step:168/7050 train_time:37205ms step_avg:221.46ms step:169/7050 train_time:37426ms step_avg:221.46ms step:170/7050 train_time:37648ms step_avg:221.46ms step:171/7050 train_time:37870ms step_avg:221.46ms step:172/7050 train_time:38091ms step_avg:221.46ms step:173/7050 train_time:38313ms step_avg:221.47ms step:174/7050 train_time:38536ms step_avg:221.47ms step:175/7050 train_time:38758ms step_avg:221.47ms step:176/7050 train_time:38978ms step_avg:221.47ms step:177/7050 train_time:39200ms step_avg:221.47ms step:178/7050 train_time:39421ms step_avg:221.47ms step:179/7050 train_time:39643ms step_avg:221.47ms step:180/7050 train_time:39865ms step_avg:221.47ms step:181/7050 train_time:40086ms 
step_avg:221.47ms step:182/7050 train_time:40307ms step_avg:221.47ms step:183/7050 train_time:40529ms step_avg:221.47ms step:184/7050 train_time:40750ms step_avg:221.47ms step:185/7050 train_time:40970ms step_avg:221.46ms step:186/7050 train_time:41191ms step_avg:221.46ms step:187/7050 train_time:41411ms step_avg:221.45ms step:188/7050 train_time:41632ms step_avg:221.45ms step:189/7050 train_time:41853ms step_avg:221.45ms step:190/7050 train_time:42074ms step_avg:221.44ms step:191/7050 train_time:42296ms step_avg:221.44ms step:192/7050 train_time:42517ms step_avg:221.45ms step:193/7050 train_time:42738ms step_avg:221.44ms step:194/7050 train_time:42959ms step_avg:221.44ms step:195/7050 train_time:43178ms step_avg:221.43ms step:196/7050 train_time:43399ms step_avg:221.43ms step:197/7050 train_time:43619ms step_avg:221.42ms step:198/7050 train_time:43840ms step_avg:221.41ms step:199/7050 train_time:44060ms step_avg:221.41ms step:200/7050 train_time:44280ms step_avg:221.40ms step:201/7050 train_time:44502ms step_avg:221.40ms step:202/7050 train_time:44724ms step_avg:221.40ms step:203/7050 train_time:44943ms step_avg:221.40ms step:204/7050 train_time:45163ms step_avg:221.39ms step:205/7050 train_time:45384ms step_avg:221.38ms step:206/7050 train_time:45604ms step_avg:221.38ms step:207/7050 train_time:45827ms step_avg:221.39ms step:208/7050 train_time:46048ms step_avg:221.38ms step:209/7050 train_time:46269ms step_avg:221.38ms step:210/7050 train_time:46491ms step_avg:221.38ms step:211/7050 train_time:46712ms step_avg:221.39ms step:212/7050 train_time:46934ms step_avg:221.39ms step:213/7050 train_time:47156ms step_avg:221.39ms step:214/7050 train_time:47376ms step_avg:221.38ms step:215/7050 train_time:47596ms step_avg:221.38ms step:216/7050 train_time:47817ms step_avg:221.38ms step:217/7050 train_time:48038ms step_avg:221.37ms step:218/7050 train_time:48259ms step_avg:221.37ms step:219/7050 train_time:48480ms step_avg:221.37ms step:220/7050 train_time:48701ms 
step_avg:221.37ms step:221/7050 train_time:48921ms step_avg:221.36ms step:222/7050 train_time:49141ms step_avg:221.36ms step:223/7050 train_time:49362ms step_avg:221.35ms step:224/7050 train_time:49582ms step_avg:221.35ms step:225/7050 train_time:49804ms step_avg:221.35ms step:226/7050 train_time:50024ms step_avg:221.34ms step:227/7050 train_time:50245ms step_avg:221.34ms step:228/7050 train_time:50465ms step_avg:221.34ms step:229/7050 train_time:50685ms step_avg:221.33ms step:230/7050 train_time:50907ms step_avg:221.33ms step:231/7050 train_time:51127ms step_avg:221.33ms step:232/7050 train_time:51349ms step_avg:221.33ms step:233/7050 train_time:51569ms step_avg:221.33ms step:234/7050 train_time:51790ms step_avg:221.33ms step:235/7050 train_time:52011ms step_avg:221.32ms step:236/7050 train_time:52230ms step_avg:221.32ms step:237/7050 train_time:52452ms step_avg:221.32ms step:238/7050 train_time:52674ms step_avg:221.32ms step:239/7050 train_time:52895ms step_avg:221.32ms step:240/7050 train_time:53115ms step_avg:221.31ms step:241/7050 train_time:53337ms step_avg:221.31ms step:242/7050 train_time:53558ms step_avg:221.32ms step:243/7050 train_time:53778ms step_avg:221.31ms step:244/7050 train_time:53998ms step_avg:221.30ms step:245/7050 train_time:54219ms step_avg:221.30ms step:246/7050 train_time:54439ms step_avg:221.30ms step:247/7050 train_time:54659ms step_avg:221.29ms step:248/7050 train_time:54880ms step_avg:221.29ms step:249/7050 train_time:55100ms step_avg:221.28ms step:250/7050 train_time:55321ms step_avg:221.29ms step:250/7050 val_loss:4.1950 train_time:55494ms step_avg:221.98ms step:251/7050 train_time:55541ms step_avg:221.28ms step:252/7050 train_time:55759ms step_avg:221.27ms step:253/7050 train_time:55983ms step_avg:221.28ms step:254/7050 train_time:56207ms step_avg:221.29ms step:255/7050 train_time:56426ms step_avg:221.28ms step:256/7050 train_time:56646ms step_avg:221.27ms step:257/7050 train_time:56866ms step_avg:221.27ms step:258/7050 
train_time:57091ms step_avg:221.28ms step:259/7050 train_time:57311ms step_avg:221.28ms step:260/7050 train_time:57530ms step_avg:221.27ms step:261/7050 train_time:57750ms step_avg:221.26ms step:262/7050 train_time:57970ms step_avg:221.26ms step:263/7050 train_time:58193ms step_avg:221.27ms step:264/7050 train_time:58414ms step_avg:221.26ms step:265/7050 train_time:58634ms step_avg:221.26ms step:266/7050 train_time:58853ms step_avg:221.25ms step:267/7050 train_time:59074ms step_avg:221.25ms step:268/7050 train_time:59294ms step_avg:221.25ms step:269/7050 train_time:59515ms step_avg:221.25ms step:270/7050 train_time:59735ms step_avg:221.24ms step:271/7050 train_time:59956ms step_avg:221.24ms step:272/7050 train_time:60177ms step_avg:221.24ms step:273/7050 train_time:60398ms step_avg:221.24ms step:274/7050 train_time:60619ms step_avg:221.24ms step:275/7050 train_time:60840ms step_avg:221.24ms step:276/7050 train_time:61060ms step_avg:221.23ms step:277/7050 train_time:61281ms step_avg:221.23ms step:278/7050 train_time:61502ms step_avg:221.23ms step:279/7050 train_time:61723ms step_avg:221.23ms step:280/7050 train_time:61943ms step_avg:221.23ms step:281/7050 train_time:62165ms step_avg:221.23ms step:282/7050 train_time:62385ms step_avg:221.22ms step:283/7050 train_time:62605ms step_avg:221.22ms step:284/7050 train_time:62826ms step_avg:221.22ms step:285/7050 train_time:63046ms step_avg:221.21ms step:286/7050 train_time:63267ms step_avg:221.21ms step:287/7050 train_time:63487ms step_avg:221.21ms step:288/7050 train_time:63710ms step_avg:221.21ms step:289/7050 train_time:63930ms step_avg:221.21ms step:290/7050 train_time:64150ms step_avg:221.21ms step:291/7050 train_time:64371ms step_avg:221.21ms step:292/7050 train_time:64591ms step_avg:221.20ms step:293/7050 train_time:64812ms step_avg:221.20ms step:294/7050 train_time:65032ms step_avg:221.20ms step:295/7050 train_time:65253ms step_avg:221.20ms step:296/7050 train_time:65474ms step_avg:221.20ms step:297/7050 
train_time:65694ms step_avg:221.19ms step:298/7050 train_time:65914ms step_avg:221.19ms step:299/7050 train_time:66135ms step_avg:221.19ms step:300/7050 train_time:66357ms step_avg:221.19ms step:301/7050 train_time:66577ms step_avg:221.19ms step:302/7050 train_time:66799ms step_avg:221.19ms step:303/7050 train_time:67020ms step_avg:221.19ms step:304/7050 train_time:67240ms step_avg:221.18ms step:305/7050 train_time:67461ms step_avg:221.18ms step:306/7050 train_time:67680ms step_avg:221.18ms step:307/7050 train_time:67902ms step_avg:221.18ms step:308/7050 train_time:68123ms step_avg:221.18ms step:309/7050 train_time:68344ms step_avg:221.18ms step:310/7050 train_time:68565ms step_avg:221.18ms step:311/7050 train_time:68785ms step_avg:221.17ms step:312/7050 train_time:69006ms step_avg:221.17ms step:313/7050 train_time:69226ms step_avg:221.17ms step:314/7050 train_time:69446ms step_avg:221.17ms step:315/7050 train_time:69668ms step_avg:221.17ms step:316/7050 train_time:69888ms step_avg:221.16ms step:317/7050 train_time:70108ms step_avg:221.16ms step:318/7050 train_time:70329ms step_avg:221.16ms step:319/7050 train_time:70549ms step_avg:221.16ms step:320/7050 train_time:70769ms step_avg:221.15ms step:321/7050 train_time:70989ms step_avg:221.15ms step:322/7050 train_time:71209ms step_avg:221.15ms step:323/7050 train_time:71430ms step_avg:221.15ms step:324/7050 train_time:71651ms step_avg:221.15ms step:325/7050 train_time:71872ms step_avg:221.15ms step:326/7050 train_time:72093ms step_avg:221.14ms step:327/7050 train_time:72314ms step_avg:221.14ms step:328/7050 train_time:72535ms step_avg:221.14ms step:329/7050 train_time:72756ms step_avg:221.14ms step:330/7050 train_time:72978ms step_avg:221.14ms step:331/7050 train_time:73198ms step_avg:221.14ms step:332/7050 train_time:73418ms step_avg:221.14ms step:333/7050 train_time:73640ms step_avg:221.14ms step:334/7050 train_time:73860ms step_avg:221.14ms step:335/7050 train_time:74080ms step_avg:221.14ms step:336/7050 
train_time:74302ms step_avg:221.14ms step:337/7050 train_time:74523ms step_avg:221.14ms step:338/7050 train_time:74744ms step_avg:221.14ms step:339/7050 train_time:74965ms step_avg:221.14ms step:340/7050 train_time:75186ms step_avg:221.13ms step:341/7050 train_time:75406ms step_avg:221.13ms step:342/7050 train_time:75626ms step_avg:221.13ms step:343/7050 train_time:75848ms step_avg:221.13ms step:344/7050 train_time:76068ms step_avg:221.13ms step:345/7050 train_time:76289ms step_avg:221.13ms step:346/7050 train_time:76508ms step_avg:221.12ms step:347/7050 train_time:76729ms step_avg:221.12ms step:348/7050 train_time:76950ms step_avg:221.12ms step:349/7050 train_time:77170ms step_avg:221.12ms step:350/7050 train_time:77390ms step_avg:221.11ms step:351/7050 train_time:77610ms step_avg:221.11ms step:352/7050 train_time:77831ms step_avg:221.11ms step:353/7050 train_time:78052ms step_avg:221.11ms step:354/7050 train_time:78273ms step_avg:221.11ms step:355/7050 train_time:78493ms step_avg:221.11ms step:356/7050 train_time:78714ms step_avg:221.11ms step:357/7050 train_time:78934ms step_avg:221.10ms step:358/7050 train_time:79154ms step_avg:221.10ms step:359/7050 train_time:79376ms step_avg:221.10ms step:360/7050 train_time:79596ms step_avg:221.10ms step:361/7050 train_time:79818ms step_avg:221.10ms step:362/7050 train_time:80038ms step_avg:221.10ms step:363/7050 train_time:80259ms step_avg:221.10ms step:364/7050 train_time:80479ms step_avg:221.10ms step:365/7050 train_time:80700ms step_avg:221.10ms step:366/7050 train_time:80921ms step_avg:221.09ms step:367/7050 train_time:81141ms step_avg:221.09ms step:368/7050 train_time:81361ms step_avg:221.09ms step:369/7050 train_time:81583ms step_avg:221.09ms step:370/7050 train_time:81804ms step_avg:221.09ms step:371/7050 train_time:82025ms step_avg:221.09ms step:372/7050 train_time:82245ms step_avg:221.09ms step:373/7050 train_time:82466ms step_avg:221.09ms step:374/7050 train_time:82688ms step_avg:221.09ms step:375/7050 
train_time:82908ms step_avg:221.09ms step:375/7050 val_loss:4.0422 train_time:83082ms step_avg:221.55ms step:376/7050 train_time:83129ms step_avg:221.09ms step:377/7050 train_time:83350ms step_avg:221.09ms step:378/7050 train_time:83574ms step_avg:221.09ms step:379/7050 train_time:83795ms step_avg:221.10ms step:380/7050 train_time:84015ms step_avg:221.09ms step:381/7050 train_time:84236ms step_avg:221.09ms step:382/7050 train_time:84457ms step_avg:221.09ms step:383/7050 train_time:84681ms step_avg:221.10ms step:384/7050 train_time:84902ms step_avg:221.10ms step:385/7050 train_time:85122ms step_avg:221.10ms step:386/7050 train_time:85342ms step_avg:221.09ms step:387/7050 train_time:85562ms step_avg:221.09ms step:388/7050 train_time:85784ms step_avg:221.09ms step:389/7050 train_time:86003ms step_avg:221.09ms step:390/7050 train_time:86222ms step_avg:221.08ms step:391/7050 train_time:86443ms step_avg:221.08ms step:392/7050 train_time:86665ms step_avg:221.08ms step:393/7050 train_time:86887ms step_avg:221.09ms step:394/7050 train_time:87107ms step_avg:221.08ms step:395/7050 train_time:87327ms step_avg:221.08ms step:396/7050 train_time:87547ms step_avg:221.08ms step:397/7050 train_time:87768ms step_avg:221.08ms step:398/7050 train_time:87988ms step_avg:221.07ms step:399/7050 train_time:88209ms step_avg:221.07ms step:400/7050 train_time:88430ms step_avg:221.07ms step:401/7050 train_time:88650ms step_avg:221.07ms step:402/7050 train_time:88871ms step_avg:221.07ms step:403/7050 train_time:89092ms step_avg:221.07ms step:404/7050 train_time:89312ms step_avg:221.07ms step:405/7050 train_time:89533ms step_avg:221.07ms step:406/7050 train_time:89754ms step_avg:221.07ms step:407/7050 train_time:89974ms step_avg:221.07ms step:408/7050 train_time:90194ms step_avg:221.06ms step:409/7050 train_time:90416ms step_avg:221.07ms step:410/7050 train_time:90637ms step_avg:221.07ms step:411/7050 train_time:90858ms step_avg:221.07ms step:412/7050 train_time:91078ms step_avg:221.06ms 
step:413/7050 train_time:91299ms step_avg:221.06ms step:414/7050 train_time:91520ms step_avg:221.06ms step:415/7050 train_time:91741ms step_avg:221.06ms step:416/7050 train_time:91963ms step_avg:221.06ms step:417/7050 train_time:92182ms step_avg:221.06ms step:418/7050 train_time:92402ms step_avg:221.06ms step:419/7050 train_time:92622ms step_avg:221.06ms step:420/7050 train_time:92843ms step_avg:221.05ms step:421/7050 train_time:93063ms step_avg:221.05ms step:422/7050 train_time:93283ms step_avg:221.05ms step:423/7050 train_time:93504ms step_avg:221.05ms step:424/7050 train_time:93724ms step_avg:221.05ms step:425/7050 train_time:93944ms step_avg:221.04ms step:426/7050 train_time:94164ms step_avg:221.04ms step:427/7050 train_time:94384ms step_avg:221.04ms step:428/7050 train_time:94606ms step_avg:221.04ms step:429/7050 train_time:94826ms step_avg:221.04ms step:430/7050 train_time:95046ms step_avg:221.04ms step:431/7050 train_time:95267ms step_avg:221.04ms step:432/7050 train_time:95487ms step_avg:221.03ms step:433/7050 train_time:95708ms step_avg:221.04ms step:434/7050 train_time:95930ms step_avg:221.04ms step:435/7050 train_time:96150ms step_avg:221.04ms step:436/7050 train_time:96370ms step_avg:221.03ms step:437/7050 train_time:96591ms step_avg:221.03ms step:438/7050 train_time:96812ms step_avg:221.03ms step:439/7050 train_time:97032ms step_avg:221.03ms step:440/7050 train_time:97253ms step_avg:221.03ms step:441/7050 train_time:97472ms step_avg:221.03ms step:442/7050 train_time:97693ms step_avg:221.03ms step:443/7050 train_time:97913ms step_avg:221.02ms step:444/7050 train_time:98134ms step_avg:221.02ms step:445/7050 train_time:98355ms step_avg:221.02ms step:446/7050 train_time:98576ms step_avg:221.02ms step:447/7050 train_time:98797ms step_avg:221.02ms step:448/7050 train_time:99018ms step_avg:221.02ms step:449/7050 train_time:99240ms step_avg:221.02ms step:450/7050 train_time:99460ms step_avg:221.02ms step:451/7050 train_time:99681ms step_avg:221.02ms 
step:452/7050 train_time:99901ms step_avg:221.02ms step:453/7050 train_time:100122ms step_avg:221.02ms step:454/7050 train_time:100344ms step_avg:221.02ms step:455/7050 train_time:100563ms step_avg:221.02ms step:456/7050 train_time:100783ms step_avg:221.02ms step:457/7050 train_time:101004ms step_avg:221.01ms step:458/7050 train_time:101224ms step_avg:221.01ms step:459/7050 train_time:101444ms step_avg:221.01ms step:460/7050 train_time:101666ms step_avg:221.01ms step:461/7050 train_time:101886ms step_avg:221.01ms step:462/7050 train_time:102107ms step_avg:221.01ms step:463/7050 train_time:102327ms step_avg:221.01ms step:464/7050 train_time:102549ms step_avg:221.01ms step:465/7050 train_time:102769ms step_avg:221.01ms step:466/7050 train_time:102990ms step_avg:221.01ms step:467/7050 train_time:103211ms step_avg:221.01ms step:468/7050 train_time:103431ms step_avg:221.01ms step:469/7050 train_time:103653ms step_avg:221.01ms step:470/7050 train_time:103874ms step_avg:221.01ms step:471/7050 train_time:104095ms step_avg:221.01ms step:472/7050 train_time:104316ms step_avg:221.01ms step:473/7050 train_time:104537ms step_avg:221.01ms step:474/7050 train_time:104758ms step_avg:221.01ms step:475/7050 train_time:104978ms step_avg:221.01ms step:476/7050 train_time:105199ms step_avg:221.01ms step:477/7050 train_time:105420ms step_avg:221.01ms step:478/7050 train_time:105641ms step_avg:221.01ms step:479/7050 train_time:105861ms step_avg:221.00ms step:480/7050 train_time:106081ms step_avg:221.00ms step:481/7050 train_time:106302ms step_avg:221.00ms step:482/7050 train_time:106523ms step_avg:221.00ms step:483/7050 train_time:106742ms step_avg:221.00ms step:484/7050 train_time:106963ms step_avg:221.00ms step:485/7050 train_time:107184ms step_avg:221.00ms step:486/7050 train_time:107405ms step_avg:221.00ms step:487/7050 train_time:107626ms step_avg:221.00ms step:488/7050 train_time:107846ms step_avg:221.00ms step:489/7050 train_time:108067ms step_avg:221.00ms step:490/7050 
train_time:108287ms step_avg:220.99ms step:491/7050 train_time:108510ms step_avg:221.00ms step:492/7050 train_time:108731ms step_avg:221.00ms step:493/7050 train_time:108951ms step_avg:221.00ms step:494/7050 train_time:109172ms step_avg:221.00ms step:495/7050 train_time:109392ms step_avg:220.99ms step:496/7050 train_time:109614ms step_avg:221.00ms step:497/7050 train_time:109834ms step_avg:220.99ms step:498/7050 train_time:110056ms step_avg:221.00ms step:499/7050 train_time:110277ms step_avg:221.00ms step:500/7050 train_time:110499ms step_avg:221.00ms step:500/7050 val_loss:3.9440 train_time:110676ms step_avg:221.35ms step:501/7050 train_time:110725ms step_avg:221.01ms step:502/7050 train_time:110946ms step_avg:221.01ms step:503/7050 train_time:111168ms step_avg:221.01ms step:504/7050 train_time:111390ms step_avg:221.01ms step:505/7050 train_time:111609ms step_avg:221.01ms step:506/7050 train_time:111829ms step_avg:221.01ms step:507/7050 train_time:112051ms step_avg:221.01ms step:508/7050 train_time:112273ms step_avg:221.01ms step:509/7050 train_time:112493ms step_avg:221.01ms step:510/7050 train_time:112713ms step_avg:221.01ms step:511/7050 train_time:112934ms step_avg:221.01ms step:512/7050 train_time:113155ms step_avg:221.01ms step:513/7050 train_time:113376ms step_avg:221.01ms step:514/7050 train_time:113596ms step_avg:221.00ms step:515/7050 train_time:113817ms step_avg:221.00ms step:516/7050 train_time:114037ms step_avg:221.00ms step:517/7050 train_time:114260ms step_avg:221.00ms step:518/7050 train_time:114480ms step_avg:221.00ms step:519/7050 train_time:114700ms step_avg:221.00ms step:520/7050 train_time:114920ms step_avg:221.00ms step:521/7050 train_time:115140ms step_avg:221.00ms step:522/7050 train_time:115361ms step_avg:221.00ms step:523/7050 train_time:115582ms step_avg:221.00ms step:524/7050 train_time:115803ms step_avg:221.00ms step:525/7050 train_time:116024ms step_avg:221.00ms step:526/7050 train_time:116244ms step_avg:221.00ms step:527/7050 
train_time:116466ms step_avg:221.00ms step:528/7050 train_time:116688ms step_avg:221.00ms step:529/7050 train_time:116909ms step_avg:221.00ms step:530/7050 train_time:117130ms step_avg:221.00ms step:531/7050 train_time:117354ms step_avg:221.01ms step:532/7050 train_time:117576ms step_avg:221.01ms step:533/7050 train_time:117798ms step_avg:221.01ms step:534/7050 train_time:118019ms step_avg:221.01ms step:535/7050 train_time:118242ms step_avg:221.01ms step:536/7050 train_time:118465ms step_avg:221.02ms step:537/7050 train_time:118686ms step_avg:221.02ms step:538/7050 train_time:118908ms step_avg:221.02ms step:539/7050 train_time:119130ms step_avg:221.02ms step:540/7050 train_time:119351ms step_avg:221.02ms step:541/7050 train_time:119573ms step_avg:221.02ms step:542/7050 train_time:119795ms step_avg:221.02ms step:543/7050 train_time:120018ms step_avg:221.03ms step:544/7050 train_time:120239ms step_avg:221.03ms step:545/7050 train_time:120460ms step_avg:221.03ms step:546/7050 train_time:120683ms step_avg:221.03ms step:547/7050 train_time:120905ms step_avg:221.03ms step:548/7050 train_time:121126ms step_avg:221.03ms step:549/7050 train_time:121348ms step_avg:221.03ms step:550/7050 train_time:121570ms step_avg:221.04ms step:551/7050 train_time:121792ms step_avg:221.04ms step:552/7050 train_time:122013ms step_avg:221.04ms step:553/7050 train_time:122236ms step_avg:221.04ms step:554/7050 train_time:122459ms step_avg:221.04ms step:555/7050 train_time:122682ms step_avg:221.05ms step:556/7050 train_time:122903ms step_avg:221.05ms step:557/7050 train_time:123124ms step_avg:221.05ms step:558/7050 train_time:123346ms step_avg:221.05ms step:559/7050 train_time:123569ms step_avg:221.05ms step:560/7050 train_time:123791ms step_avg:221.06ms step:561/7050 train_time:124013ms step_avg:221.06ms step:562/7050 train_time:124233ms step_avg:221.06ms step:563/7050 train_time:124455ms step_avg:221.06ms step:564/7050 train_time:124678ms step_avg:221.06ms step:565/7050 train_time:124900ms 
step_avg:221.06ms step:566/7050 train_time:125123ms step_avg:221.07ms step:567/7050 train_time:125343ms step_avg:221.06ms step:568/7050 train_time:125565ms step_avg:221.07ms step:569/7050 train_time:125787ms step_avg:221.07ms step:570/7050 train_time:126008ms step_avg:221.07ms step:571/7050 train_time:126230ms step_avg:221.07ms step:572/7050 train_time:126452ms step_avg:221.07ms step:573/7050 train_time:126674ms step_avg:221.07ms step:574/7050 train_time:126895ms step_avg:221.07ms step:575/7050 train_time:127117ms step_avg:221.07ms step:576/7050 train_time:127339ms step_avg:221.08ms step:577/7050 train_time:127563ms step_avg:221.08ms step:578/7050 train_time:127785ms step_avg:221.08ms step:579/7050 train_time:128006ms step_avg:221.08ms step:580/7050 train_time:128228ms step_avg:221.08ms step:581/7050 train_time:128450ms step_avg:221.08ms step:582/7050 train_time:128672ms step_avg:221.09ms step:583/7050 train_time:128893ms step_avg:221.09ms step:584/7050 train_time:129116ms step_avg:221.09ms step:585/7050 train_time:129337ms step_avg:221.09ms step:586/7050 train_time:129559ms step_avg:221.09ms step:587/7050 train_time:129781ms step_avg:221.09ms step:588/7050 train_time:130003ms step_avg:221.09ms step:589/7050 train_time:130224ms step_avg:221.09ms step:590/7050 train_time:130445ms step_avg:221.09ms step:591/7050 train_time:130668ms step_avg:221.10ms step:592/7050 train_time:130890ms step_avg:221.10ms step:593/7050 train_time:131111ms step_avg:221.10ms step:594/7050 train_time:131332ms step_avg:221.10ms step:595/7050 train_time:131553ms step_avg:221.10ms step:596/7050 train_time:131775ms step_avg:221.10ms step:597/7050 train_time:131996ms step_avg:221.10ms step:598/7050 train_time:132218ms step_avg:221.10ms step:599/7050 train_time:132439ms step_avg:221.10ms step:600/7050 train_time:132662ms step_avg:221.10ms step:601/7050 train_time:132883ms step_avg:221.10ms step:602/7050 train_time:133105ms step_avg:221.11ms step:603/7050 train_time:133327ms step_avg:221.11ms 
step:604/7050 train_time:133547ms step_avg:221.10ms step:605/7050 train_time:133772ms step_avg:221.11ms step:606/7050 train_time:133994ms step_avg:221.11ms step:607/7050 train_time:134215ms step_avg:221.11ms step:608/7050 train_time:134436ms step_avg:221.11ms step:609/7050 train_time:134659ms step_avg:221.11ms step:610/7050 train_time:134882ms step_avg:221.12ms step:611/7050 train_time:135104ms step_avg:221.12ms step:612/7050 train_time:135326ms step_avg:221.12ms step:613/7050 train_time:135547ms step_avg:221.12ms step:614/7050 train_time:135770ms step_avg:221.12ms step:615/7050 train_time:135991ms step_avg:221.12ms step:616/7050 train_time:136213ms step_avg:221.12ms step:617/7050 train_time:136435ms step_avg:221.13ms step:618/7050 train_time:136656ms step_avg:221.13ms step:619/7050 train_time:136879ms step_avg:221.13ms step:620/7050 train_time:137101ms step_avg:221.13ms step:621/7050 train_time:137322ms step_avg:221.13ms step:622/7050 train_time:137543ms step_avg:221.13ms step:623/7050 train_time:137765ms step_avg:221.13ms step:624/7050 train_time:137987ms step_avg:221.13ms step:625/7050 train_time:138209ms step_avg:221.13ms step:625/7050 val_loss:3.6602 train_time:138383ms step_avg:221.41ms step:626/7050 train_time:138431ms step_avg:221.14ms step:627/7050 train_time:138652ms step_avg:221.14ms step:628/7050 train_time:138877ms step_avg:221.14ms step:629/7050 train_time:139101ms step_avg:221.15ms step:630/7050 train_time:139321ms step_avg:221.15ms step:631/7050 train_time:139543ms step_avg:221.15ms step:632/7050 train_time:139767ms step_avg:221.15ms step:633/7050 train_time:139991ms step_avg:221.15ms step:634/7050 train_time:140213ms step_avg:221.16ms step:635/7050 train_time:140434ms step_avg:221.16ms step:636/7050 train_time:140656ms step_avg:221.16ms step:637/7050 train_time:140879ms step_avg:221.16ms step:638/7050 train_time:141102ms step_avg:221.16ms step:639/7050 train_time:141323ms step_avg:221.16ms step:640/7050 train_time:141545ms step_avg:221.16ms 
step:641/7050 train_time:141767ms step_avg:221.16ms step:642/7050 train_time:141989ms step_avg:221.17ms step:643/7050 train_time:142210ms step_avg:221.17ms step:644/7050 train_time:142434ms step_avg:221.17ms step:645/7050 train_time:142656ms step_avg:221.17ms step:646/7050 train_time:142878ms step_avg:221.17ms step:647/7050 train_time:143102ms step_avg:221.18ms step:648/7050 train_time:143324ms step_avg:221.18ms step:649/7050 train_time:143546ms step_avg:221.18ms step:650/7050 train_time:143769ms step_avg:221.18ms step:651/7050 train_time:143991ms step_avg:221.18ms step:652/7050 train_time:144213ms step_avg:221.19ms step:653/7050 train_time:144434ms step_avg:221.19ms step:654/7050 train_time:144656ms step_avg:221.19ms step:655/7050 train_time:144878ms step_avg:221.19ms step:656/7050 train_time:145100ms step_avg:221.19ms step:657/7050 train_time:145323ms step_avg:221.19ms step:658/7050 train_time:145545ms step_avg:221.19ms step:659/7050 train_time:145767ms step_avg:221.19ms step:660/7050 train_time:145988ms step_avg:221.19ms step:661/7050 train_time:146210ms step_avg:221.19ms step:662/7050 train_time:146433ms step_avg:221.20ms step:663/7050 train_time:146655ms step_avg:221.20ms step:664/7050 train_time:146876ms step_avg:221.20ms step:665/7050 train_time:147098ms step_avg:221.20ms step:666/7050 train_time:147320ms step_avg:221.20ms step:667/7050 train_time:147543ms step_avg:221.20ms step:668/7050 train_time:147766ms step_avg:221.21ms step:669/7050 train_time:147988ms step_avg:221.21ms step:670/7050 train_time:148210ms step_avg:221.21ms step:671/7050 train_time:148432ms step_avg:221.21ms step:672/7050 train_time:148654ms step_avg:221.21ms step:673/7050 train_time:148875ms step_avg:221.21ms step:674/7050 train_time:149097ms step_avg:221.21ms step:675/7050 train_time:149319ms step_avg:221.21ms step:676/7050 train_time:149542ms step_avg:221.22ms step:677/7050 train_time:149764ms step_avg:221.22ms step:678/7050 train_time:149987ms step_avg:221.22ms step:679/7050 
train_time:150211ms step_avg:221.22ms step:680/7050 train_time:150433ms step_avg:221.22ms step:681/7050 train_time:150655ms step_avg:221.23ms step:682/7050 train_time:150877ms step_avg:221.23ms step:683/7050 train_time:151098ms step_avg:221.23ms step:684/7050 train_time:151320ms step_avg:221.23ms step:685/7050 train_time:151542ms step_avg:221.23ms step:686/7050 train_time:151764ms step_avg:221.23ms step:687/7050 train_time:151986ms step_avg:221.23ms step:688/7050 train_time:152209ms step_avg:221.23ms step:689/7050 train_time:152432ms step_avg:221.24ms step:690/7050 train_time:152654ms step_avg:221.24ms step:691/7050 train_time:152876ms step_avg:221.24ms step:692/7050 train_time:153097ms step_avg:221.24ms step:693/7050 train_time:153319ms step_avg:221.24ms step:694/7050 train_time:153540ms step_avg:221.24ms step:695/7050 train_time:153763ms step_avg:221.24ms step:696/7050 train_time:153985ms step_avg:221.24ms step:697/7050 train_time:154207ms step_avg:221.24ms step:698/7050 train_time:154429ms step_avg:221.25ms step:699/7050 train_time:154651ms step_avg:221.25ms step:700/7050 train_time:154873ms step_avg:221.25ms step:701/7050 train_time:155094ms step_avg:221.25ms step:702/7050 train_time:155315ms step_avg:221.25ms step:703/7050 train_time:155537ms step_avg:221.25ms step:704/7050 train_time:155759ms step_avg:221.25ms step:705/7050 train_time:155981ms step_avg:221.25ms step:706/7050 train_time:156203ms step_avg:221.25ms step:707/7050 train_time:156425ms step_avg:221.25ms step:708/7050 train_time:156647ms step_avg:221.25ms step:709/7050 train_time:156869ms step_avg:221.25ms step:710/7050 train_time:157090ms step_avg:221.25ms step:711/7050 train_time:157313ms step_avg:221.26ms step:712/7050 train_time:157534ms step_avg:221.26ms step:713/7050 train_time:157755ms step_avg:221.26ms step:714/7050 train_time:157978ms step_avg:221.26ms step:715/7050 train_time:158199ms step_avg:221.26ms step:716/7050 train_time:158422ms step_avg:221.26ms step:717/7050 train_time:158645ms 
step_avg:221.26ms step:718/7050 train_time:158867ms step_avg:221.26ms step:719/7050 train_time:159088ms step_avg:221.26ms step:720/7050 train_time:159309ms step_avg:221.26ms step:721/7050 train_time:159531ms step_avg:221.26ms step:722/7050 train_time:159753ms step_avg:221.27ms step:723/7050 train_time:159975ms step_avg:221.27ms step:724/7050 train_time:160197ms step_avg:221.27ms step:725/7050 train_time:160419ms step_avg:221.27ms step:726/7050 train_time:160640ms step_avg:221.27ms step:727/7050 train_time:160863ms step_avg:221.27ms step:728/7050 train_time:161086ms step_avg:221.27ms step:729/7050 train_time:161307ms step_avg:221.27ms step:730/7050 train_time:161529ms step_avg:221.27ms step:731/7050 train_time:161751ms step_avg:221.27ms step:732/7050 train_time:161973ms step_avg:221.27ms step:733/7050 train_time:162194ms step_avg:221.27ms step:734/7050 train_time:162416ms step_avg:221.27ms step:735/7050 train_time:162638ms step_avg:221.28ms step:736/7050 train_time:162859ms step_avg:221.28ms step:737/7050 train_time:163081ms step_avg:221.28ms step:738/7050 train_time:163303ms step_avg:221.28ms step:739/7050 train_time:163525ms step_avg:221.28ms step:740/7050 train_time:163749ms step_avg:221.28ms step:741/7050 train_time:163970ms step_avg:221.28ms step:742/7050 train_time:164192ms step_avg:221.28ms step:743/7050 train_time:164414ms step_avg:221.28ms step:744/7050 train_time:164636ms step_avg:221.28ms step:745/7050 train_time:164857ms step_avg:221.28ms step:746/7050 train_time:165079ms step_avg:221.29ms step:747/7050 train_time:165300ms step_avg:221.29ms step:748/7050 train_time:165521ms step_avg:221.29ms step:749/7050 train_time:165744ms step_avg:221.29ms step:750/7050 train_time:165966ms step_avg:221.29ms step:750/7050 val_loss:3.5910 train_time:166140ms step_avg:221.52ms step:751/7050 train_time:166188ms step_avg:221.29ms step:752/7050 train_time:166410ms step_avg:221.29ms step:753/7050 train_time:166636ms step_avg:221.30ms step:754/7050 train_time:166862ms 
step_avg:221.30ms step:755/7050 train_time:167082ms step_avg:221.30ms step:756/7050 train_time:167304ms step_avg:221.30ms step:757/7050 train_time:167525ms step_avg:221.30ms step:758/7050 train_time:167749ms step_avg:221.30ms step:759/7050 train_time:167972ms step_avg:221.31ms step:760/7050 train_time:168193ms step_avg:221.31ms step:761/7050 train_time:168414ms step_avg:221.31ms step:762/7050 train_time:168636ms step_avg:221.31ms step:763/7050 train_time:168859ms step_avg:221.31ms step:764/7050 train_time:169081ms step_avg:221.31ms step:765/7050 train_time:169302ms step_avg:221.31ms step:766/7050 train_time:169524ms step_avg:221.31ms step:767/7050 train_time:169747ms step_avg:221.31ms step:768/7050 train_time:169970ms step_avg:221.31ms step:769/7050 train_time:170191ms step_avg:221.31ms step:770/7050 train_time:170413ms step_avg:221.32ms step:771/7050 train_time:170635ms step_avg:221.32ms step:772/7050 train_time:170859ms step_avg:221.32ms step:773/7050 train_time:171080ms step_avg:221.32ms step:774/7050 train_time:171301ms step_avg:221.32ms step:775/7050 train_time:171524ms step_avg:221.32ms step:776/7050 train_time:171744ms step_avg:221.32ms step:777/7050 train_time:171967ms step_avg:221.32ms step:778/7050 train_time:172189ms step_avg:221.32ms step:779/7050 train_time:172411ms step_avg:221.32ms step:780/7050 train_time:172634ms step_avg:221.33ms step:781/7050 train_time:172856ms step_avg:221.33ms step:782/7050 train_time:173078ms step_avg:221.33ms step:783/7050 train_time:173301ms step_avg:221.33ms step:784/7050 train_time:173523ms step_avg:221.33ms step:785/7050 train_time:173744ms step_avg:221.33ms step:786/7050 train_time:173966ms step_avg:221.33ms step:787/7050 train_time:174188ms step_avg:221.33ms step:788/7050 train_time:174411ms step_avg:221.33ms step:789/7050 train_time:174632ms step_avg:221.33ms step:790/7050 train_time:174855ms step_avg:221.34ms step:791/7050 train_time:175077ms step_avg:221.34ms step:792/7050 train_time:175299ms step_avg:221.34ms 
step:793/7050 train_time:175521ms step_avg:221.34ms step:794/7050 train_time:175741ms step_avg:221.34ms step:795/7050 train_time:175964ms step_avg:221.34ms step:796/7050 train_time:176184ms step_avg:221.34ms step:797/7050 train_time:176406ms step_avg:221.34ms step:798/7050 train_time:176629ms step_avg:221.34ms step:799/7050 train_time:176851ms step_avg:221.34ms step:800/7050 train_time:177073ms step_avg:221.34ms step:801/7050 train_time:177296ms step_avg:221.34ms step:802/7050 train_time:177520ms step_avg:221.35ms step:803/7050 train_time:177741ms step_avg:221.35ms step:804/7050 train_time:177963ms step_avg:221.35ms step:805/7050 train_time:178185ms step_avg:221.35ms step:806/7050 train_time:178407ms step_avg:221.35ms step:807/7050 train_time:178630ms step_avg:221.35ms step:808/7050 train_time:178852ms step_avg:221.35ms step:809/7050 train_time:179075ms step_avg:221.35ms step:810/7050 train_time:179297ms step_avg:221.35ms step:811/7050 train_time:179519ms step_avg:221.35ms step:812/7050 train_time:179740ms step_avg:221.36ms step:813/7050 train_time:179961ms step_avg:221.35ms step:814/7050 train_time:180182ms step_avg:221.35ms step:815/7050 train_time:180404ms step_avg:221.35ms step:816/7050 train_time:180626ms step_avg:221.36ms step:817/7050 train_time:180848ms step_avg:221.36ms step:818/7050 train_time:181069ms step_avg:221.36ms step:819/7050 train_time:181292ms step_avg:221.36ms step:820/7050 train_time:181514ms step_avg:221.36ms step:821/7050 train_time:181736ms step_avg:221.36ms step:822/7050 train_time:181958ms step_avg:221.36ms step:823/7050 train_time:182180ms step_avg:221.36ms step:824/7050 train_time:182402ms step_avg:221.36ms step:825/7050 train_time:182623ms step_avg:221.36ms step:826/7050 train_time:182844ms step_avg:221.36ms step:827/7050 train_time:183066ms step_avg:221.36ms step:828/7050 train_time:183289ms step_avg:221.36ms step:829/7050 train_time:183511ms step_avg:221.36ms step:830/7050 train_time:183734ms step_avg:221.37ms step:831/7050 
train_time:183956ms step_avg:221.37ms step:832/7050 train_time:184179ms step_avg:221.37ms step:833/7050 train_time:184402ms step_avg:221.37ms step:834/7050 train_time:184624ms step_avg:221.37ms step:835/7050 train_time:184846ms step_avg:221.37ms step:836/7050 train_time:185069ms step_avg:221.37ms step:837/7050 train_time:185291ms step_avg:221.37ms step:838/7050 train_time:185513ms step_avg:221.38ms step:839/7050 train_time:185734ms step_avg:221.38ms step:840/7050 train_time:185956ms step_avg:221.38ms step:841/7050 train_time:186178ms step_avg:221.38ms step:842/7050 train_time:186401ms step_avg:221.38ms step:843/7050 train_time:186623ms step_avg:221.38ms step:844/7050 train_time:186844ms step_avg:221.38ms step:845/7050 train_time:187066ms step_avg:221.38ms step:846/7050 train_time:187288ms step_avg:221.38ms step:847/7050 train_time:187509ms step_avg:221.38ms step:848/7050 train_time:187732ms step_avg:221.38ms step:849/7050 train_time:187955ms step_avg:221.38ms step:850/7050 train_time:188178ms step_avg:221.39ms step:851/7050 train_time:188400ms step_avg:221.39ms step:852/7050 train_time:188621ms step_avg:221.39ms step:853/7050 train_time:188842ms step_avg:221.39ms step:854/7050 train_time:189063ms step_avg:221.38ms step:855/7050 train_time:189285ms step_avg:221.39ms step:856/7050 train_time:189508ms step_avg:221.39ms step:857/7050 train_time:189729ms step_avg:221.39ms step:858/7050 train_time:189951ms step_avg:221.39ms step:859/7050 train_time:190173ms step_avg:221.39ms step:860/7050 train_time:190395ms step_avg:221.39ms step:861/7050 train_time:190617ms step_avg:221.39ms step:862/7050 train_time:190838ms step_avg:221.39ms step:863/7050 train_time:191059ms step_avg:221.39ms step:864/7050 train_time:191280ms step_avg:221.39ms step:865/7050 train_time:191502ms step_avg:221.39ms step:866/7050 train_time:191724ms step_avg:221.39ms step:867/7050 train_time:191945ms step_avg:221.39ms step:868/7050 train_time:192168ms step_avg:221.39ms step:869/7050 train_time:192391ms 
step_avg:221.39ms step:870/7050 train_time:192613ms step_avg:221.39ms step:871/7050 train_time:192835ms step_avg:221.39ms step:872/7050 train_time:193057ms step_avg:221.40ms step:873/7050 train_time:193279ms step_avg:221.40ms step:874/7050 train_time:193502ms step_avg:221.40ms step:875/7050 train_time:193724ms step_avg:221.40ms step:875/7050 val_loss:3.5372 train_time:193899ms step_avg:221.60ms step:876/7050 train_time:193948ms step_avg:221.40ms step:877/7050 train_time:194169ms step_avg:221.40ms step:878/7050 train_time:194397ms step_avg:221.41ms step:879/7050 train_time:194620ms step_avg:221.41ms step:880/7050 train_time:194840ms step_avg:221.41ms step:881/7050 train_time:195061ms step_avg:221.41ms step:882/7050 train_time:195285ms step_avg:221.41ms step:883/7050 train_time:195509ms step_avg:221.41ms step:884/7050 train_time:195730ms step_avg:221.41ms step:885/7050 train_time:195952ms step_avg:221.41ms step:886/7050 train_time:196173ms step_avg:221.41ms step:887/7050 train_time:196395ms step_avg:221.42ms step:888/7050 train_time:196617ms step_avg:221.42ms step:889/7050 train_time:196838ms step_avg:221.41ms step:890/7050 train_time:197059ms step_avg:221.41ms step:891/7050 train_time:197281ms step_avg:221.41ms step:892/7050 train_time:197504ms step_avg:221.42ms step:893/7050 train_time:197727ms step_avg:221.42ms step:894/7050 train_time:197950ms step_avg:221.42ms step:895/7050 train_time:198171ms step_avg:221.42ms step:896/7050 train_time:198393ms step_avg:221.42ms step:897/7050 train_time:198616ms step_avg:221.42ms step:898/7050 train_time:198839ms step_avg:221.42ms step:899/7050 train_time:199060ms step_avg:221.42ms step:900/7050 train_time:199283ms step_avg:221.43ms step:901/7050 train_time:199505ms step_avg:221.43ms step:902/7050 train_time:199728ms step_avg:221.43ms step:903/7050 train_time:199951ms step_avg:221.43ms step:904/7050 train_time:200172ms step_avg:221.43ms step:905/7050 train_time:200394ms step_avg:221.43ms step:906/7050 train_time:200617ms 
step_avg:221.43ms step:907/7050 train_time:200839ms step_avg:221.43ms step:908/7050 train_time:201061ms step_avg:221.43ms step:909/7050 train_time:201283ms step_avg:221.43ms step:910/7050 train_time:201507ms step_avg:221.44ms step:911/7050 train_time:201729ms step_avg:221.44ms step:912/7050 train_time:201952ms step_avg:221.44ms step:913/7050 train_time:202173ms step_avg:221.44ms step:914/7050 train_time:202395ms step_avg:221.44ms step:915/7050 train_time:202616ms step_avg:221.44ms step:916/7050 train_time:202839ms step_avg:221.44ms step:917/7050 train_time:203061ms step_avg:221.44ms step:918/7050 train_time:203283ms step_avg:221.44ms step:919/7050 train_time:203504ms step_avg:221.44ms step:920/7050 train_time:203727ms step_avg:221.44ms step:921/7050 train_time:203949ms step_avg:221.44ms step:922/7050 train_time:204171ms step_avg:221.44ms step:923/7050 train_time:204392ms step_avg:221.44ms step:924/7050 train_time:204615ms step_avg:221.44ms step:925/7050 train_time:204837ms step_avg:221.45ms step:926/7050 train_time:205059ms step_avg:221.45ms step:927/7050 train_time:205280ms step_avg:221.45ms step:928/7050 train_time:205503ms step_avg:221.45ms step:929/7050 train_time:205726ms step_avg:221.45ms step:930/7050 train_time:205948ms step_avg:221.45ms step:931/7050 train_time:206170ms step_avg:221.45ms step:932/7050 train_time:206390ms step_avg:221.45ms step:933/7050 train_time:206612ms step_avg:221.45ms step:934/7050 train_time:206834ms step_avg:221.45ms step:935/7050 train_time:207057ms step_avg:221.45ms step:936/7050 train_time:207278ms step_avg:221.45ms step:937/7050 train_time:207500ms step_avg:221.45ms step:938/7050 train_time:207723ms step_avg:221.45ms step:939/7050 train_time:207945ms step_avg:221.45ms step:940/7050 train_time:208167ms step_avg:221.45ms step:941/7050 train_time:208388ms step_avg:221.45ms step:942/7050 train_time:208610ms step_avg:221.45ms step:943/7050 train_time:208832ms step_avg:221.45ms step:944/7050 train_time:209054ms step_avg:221.46ms 
step:945/7050 train_time:209275ms step_avg:221.46ms step:946/7050 train_time:209497ms step_avg:221.46ms step:947/7050 train_time:209719ms step_avg:221.46ms step:948/7050 train_time:209941ms step_avg:221.46ms step:949/7050 train_time:210164ms step_avg:221.46ms step:950/7050 train_time:210385ms step_avg:221.46ms step:951/7050 train_time:210608ms step_avg:221.46ms step:952/7050 train_time:210829ms step_avg:221.46ms step:953/7050 train_time:211050ms step_avg:221.46ms step:954/7050 train_time:211271ms step_avg:221.46ms step:955/7050 train_time:211493ms step_avg:221.46ms step:956/7050 train_time:211717ms step_avg:221.46ms step:957/7050 train_time:211938ms step_avg:221.46ms step:958/7050 train_time:212162ms step_avg:221.46ms step:959/7050 train_time:212384ms step_avg:221.46ms step:960/7050 train_time:212607ms step_avg:221.47ms step:961/7050 train_time:212828ms step_avg:221.47ms step:962/7050 train_time:213051ms step_avg:221.47ms step:963/7050 train_time:213273ms step_avg:221.47ms step:964/7050 train_time:213494ms step_avg:221.47ms step:965/7050 train_time:213716ms step_avg:221.47ms step:966/7050 train_time:213938ms step_avg:221.47ms step:967/7050 train_time:214162ms step_avg:221.47ms step:968/7050 train_time:214383ms step_avg:221.47ms step:969/7050 train_time:214604ms step_avg:221.47ms step:970/7050 train_time:214826ms step_avg:221.47ms step:971/7050 train_time:215048ms step_avg:221.47ms step:972/7050 train_time:215270ms step_avg:221.47ms step:973/7050 train_time:215492ms step_avg:221.47ms step:974/7050 train_time:215715ms step_avg:221.47ms step:975/7050 train_time:215937ms step_avg:221.47ms step:976/7050 train_time:216159ms step_avg:221.47ms step:977/7050 train_time:216380ms step_avg:221.47ms step:978/7050 train_time:216602ms step_avg:221.47ms step:979/7050 train_time:216826ms step_avg:221.48ms step:980/7050 train_time:217048ms step_avg:221.48ms step:981/7050 train_time:217270ms step_avg:221.48ms step:982/7050 train_time:217491ms step_avg:221.48ms step:983/7050 
train_time:217713ms step_avg:221.48ms step:984/7050 train_time:217935ms step_avg:221.48ms step:985/7050 train_time:218158ms step_avg:221.48ms step:986/7050 train_time:218380ms step_avg:221.48ms step:987/7050 train_time:218601ms step_avg:221.48ms step:988/7050 train_time:218823ms step_avg:221.48ms step:989/7050 train_time:219049ms step_avg:221.49ms step:990/7050 train_time:219271ms step_avg:221.49ms step:991/7050 train_time:219491ms step_avg:221.48ms step:992/7050 train_time:219712ms step_avg:221.48ms step:993/7050 train_time:219935ms step_avg:221.49ms step:994/7050 train_time:220157ms step_avg:221.49ms step:995/7050 train_time:220379ms step_avg:221.49ms step:996/7050 train_time:220600ms step_avg:221.49ms step:997/7050 train_time:220823ms step_avg:221.49ms step:998/7050 train_time:221047ms step_avg:221.49ms step:999/7050 train_time:221269ms step_avg:221.49ms step:1000/7050 train_time:221490ms step_avg:221.49ms step:1000/7050 val_loss:3.4938 train_time:221664ms step_avg:221.66ms step:1001/7050 train_time:221714ms step_avg:221.49ms step:1002/7050 train_time:221933ms step_avg:221.49ms step:1003/7050 train_time:222160ms step_avg:221.50ms step:1004/7050 train_time:222384ms step_avg:221.50ms step:1005/7050 train_time:222604ms step_avg:221.50ms step:1006/7050 train_time:222826ms step_avg:221.50ms step:1007/7050 train_time:223048ms step_avg:221.50ms step:1008/7050 train_time:223272ms step_avg:221.50ms step:1009/7050 train_time:223495ms step_avg:221.50ms step:1010/7050 train_time:223717ms step_avg:221.50ms step:1011/7050 train_time:223937ms step_avg:221.50ms step:1012/7050 train_time:224160ms step_avg:221.50ms step:1013/7050 train_time:224382ms step_avg:221.50ms step:1014/7050 train_time:224604ms step_avg:221.50ms step:1015/7050 train_time:224826ms step_avg:221.50ms step:1016/7050 train_time:225047ms step_avg:221.50ms step:1017/7050 train_time:225269ms step_avg:221.50ms step:1018/7050 train_time:225492ms step_avg:221.51ms step:1019/7050 train_time:225714ms step_avg:221.51ms 
step:1020/7050 train_time:225936ms step_avg:221.51ms step:1021/7050 train_time:226158ms step_avg:221.51ms step:1022/7050 train_time:226380ms step_avg:221.51ms step:1023/7050 train_time:226603ms step_avg:221.51ms step:1024/7050 train_time:226825ms step_avg:221.51ms step:1025/7050 train_time:227048ms step_avg:221.51ms step:1026/7050 train_time:227270ms step_avg:221.51ms step:1027/7050 train_time:227492ms step_avg:221.51ms step:1028/7050 train_time:227714ms step_avg:221.51ms step:1029/7050 train_time:227936ms step_avg:221.51ms step:1030/7050 train_time:228159ms step_avg:221.51ms step:1031/7050 train_time:228381ms step_avg:221.51ms step:1032/7050 train_time:228603ms step_avg:221.51ms step:1033/7050 train_time:228826ms step_avg:221.52ms step:1034/7050 train_time:229046ms step_avg:221.51ms step:1035/7050 train_time:229269ms step_avg:221.52ms step:1036/7050 train_time:229492ms step_avg:221.52ms step:1037/7050 train_time:229715ms step_avg:221.52ms step:1038/7050 train_time:229936ms step_avg:221.52ms step:1039/7050 train_time:230158ms step_avg:221.52ms step:1040/7050 train_time:230380ms step_avg:221.52ms step:1041/7050 train_time:230602ms step_avg:221.52ms step:1042/7050 train_time:230824ms step_avg:221.52ms step:1043/7050 train_time:231046ms step_avg:221.52ms step:1044/7050 train_time:231268ms step_avg:221.52ms step:1045/7050 train_time:231491ms step_avg:221.52ms step:1046/7050 train_time:231713ms step_avg:221.52ms step:1047/7050 train_time:231937ms step_avg:221.53ms step:1048/7050 train_time:232160ms step_avg:221.53ms step:1049/7050 train_time:232383ms step_avg:221.53ms step:1050/7050 train_time:232606ms step_avg:221.53ms step:1051/7050 train_time:232829ms step_avg:221.53ms step:1052/7050 train_time:233053ms step_avg:221.53ms step:1053/7050 train_time:233275ms step_avg:221.53ms step:1054/7050 train_time:233499ms step_avg:221.54ms step:1055/7050 train_time:233722ms step_avg:221.54ms step:1056/7050 train_time:233946ms step_avg:221.54ms step:1057/7050 train_time:234169ms 
step_avg:221.54ms step:1058/7050 train_time:234392ms step_avg:221.54ms step:1059/7050 train_time:234616ms step_avg:221.55ms step:1060/7050 train_time:234838ms step_avg:221.55ms step:1061/7050 train_time:235060ms step_avg:221.55ms step:1062/7050 train_time:235284ms step_avg:221.55ms step:1063/7050 train_time:235508ms step_avg:221.55ms step:1064/7050 train_time:235731ms step_avg:221.55ms step:1065/7050 train_time:235953ms step_avg:221.55ms step:1066/7050 train_time:236176ms step_avg:221.55ms step:1067/7050 train_time:236399ms step_avg:221.55ms step:1068/7050 train_time:236622ms step_avg:221.56ms step:1069/7050 train_time:236844ms step_avg:221.56ms step:1070/7050 train_time:237067ms step_avg:221.56ms step:1071/7050 train_time:237290ms step_avg:221.56ms step:1072/7050 train_time:237513ms step_avg:221.56ms step:1073/7050 train_time:237736ms step_avg:221.56ms step:1074/7050 train_time:237959ms step_avg:221.56ms step:1075/7050 train_time:238184ms step_avg:221.57ms step:1076/7050 train_time:238407ms step_avg:221.57ms step:1077/7050 train_time:238630ms step_avg:221.57ms step:1078/7050 train_time:238854ms step_avg:221.57ms step:1079/7050 train_time:239077ms step_avg:221.57ms step:1080/7050 train_time:239300ms step_avg:221.57ms step:1081/7050 train_time:239522ms step_avg:221.57ms step:1082/7050 train_time:239745ms step_avg:221.58ms step:1083/7050 train_time:239969ms step_avg:221.58ms step:1084/7050 train_time:240193ms step_avg:221.58ms step:1085/7050 train_time:240417ms step_avg:221.58ms step:1086/7050 train_time:240640ms step_avg:221.58ms step:1087/7050 train_time:240864ms step_avg:221.59ms step:1088/7050 train_time:241087ms step_avg:221.59ms step:1089/7050 train_time:241311ms step_avg:221.59ms step:1090/7050 train_time:241534ms step_avg:221.59ms step:1091/7050 train_time:241757ms step_avg:221.59ms step:1092/7050 train_time:241980ms step_avg:221.59ms step:1093/7050 train_time:242204ms step_avg:221.60ms step:1094/7050 train_time:242427ms step_avg:221.60ms step:1095/7050 
train_time:242650ms step_avg:221.60ms step:1096/7050 train_time:242874ms step_avg:221.60ms step:1097/7050 train_time:243098ms step_avg:221.60ms step:1098/7050 train_time:243320ms step_avg:221.60ms step:1099/7050 train_time:243544ms step_avg:221.60ms step:1100/7050 train_time:243766ms step_avg:221.61ms step:1101/7050 train_time:243989ms step_avg:221.61ms step:1102/7050 train_time:244213ms step_avg:221.61ms step:1103/7050 train_time:244436ms step_avg:221.61ms step:1104/7050 train_time:244661ms step_avg:221.61ms step:1105/7050 train_time:244883ms step_avg:221.61ms step:1106/7050 train_time:245107ms step_avg:221.62ms step:1107/7050 train_time:245331ms step_avg:221.62ms step:1108/7050 train_time:245554ms step_avg:221.62ms step:1109/7050 train_time:245777ms step_avg:221.62ms step:1110/7050 train_time:246001ms step_avg:221.62ms step:1111/7050 train_time:246224ms step_avg:221.62ms step:1112/7050 train_time:246447ms step_avg:221.62ms step:1113/7050 train_time:246669ms step_avg:221.63ms step:1114/7050 train_time:246892ms step_avg:221.63ms step:1115/7050 train_time:247116ms step_avg:221.63ms step:1116/7050 train_time:247338ms step_avg:221.63ms step:1117/7050 train_time:247560ms step_avg:221.63ms step:1118/7050 train_time:247782ms step_avg:221.63ms step:1119/7050 train_time:248006ms step_avg:221.63ms step:1120/7050 train_time:248229ms step_avg:221.63ms step:1121/7050 train_time:248453ms step_avg:221.64ms step:1122/7050 train_time:248677ms step_avg:221.64ms step:1123/7050 train_time:248901ms step_avg:221.64ms step:1124/7050 train_time:249124ms step_avg:221.64ms step:1125/7050 train_time:249346ms step_avg:221.64ms step:1125/7050 val_loss:3.4290 train_time:249524ms step_avg:221.80ms step:1126/7050 train_time:249571ms step_avg:221.64ms step:1127/7050 train_time:249793ms step_avg:221.64ms step:1128/7050 train_time:250021ms step_avg:221.65ms step:1129/7050 train_time:250246ms step_avg:221.65ms step:1130/7050 train_time:250468ms step_avg:221.65ms step:1131/7050 train_time:250690ms 
step_avg:221.65ms step:1132/7050 train_time:250914ms step_avg:221.66ms step:1133/7050 train_time:251138ms step_avg:221.66ms step:1134/7050 train_time:251363ms step_avg:221.66ms step:1135/7050 train_time:251584ms step_avg:221.66ms step:1136/7050 train_time:251806ms step_avg:221.66ms step:1137/7050 train_time:252029ms step_avg:221.66ms step:1138/7050 train_time:252253ms step_avg:221.66ms step:1139/7050 train_time:252476ms step_avg:221.67ms step:1140/7050 train_time:252699ms step_avg:221.67ms step:1141/7050 train_time:252922ms step_avg:221.67ms step:1142/7050 train_time:253146ms step_avg:221.67ms step:1143/7050 train_time:253370ms step_avg:221.67ms step:1144/7050 train_time:253593ms step_avg:221.67ms step:1145/7050 train_time:253817ms step_avg:221.67ms step:1146/7050 train_time:254041ms step_avg:221.68ms step:1147/7050 train_time:254265ms step_avg:221.68ms step:1148/7050 train_time:254486ms step_avg:221.68ms step:1149/7050 train_time:254709ms step_avg:221.68ms step:1150/7050 train_time:254932ms step_avg:221.68ms step:1151/7050 train_time:255155ms step_avg:221.68ms step:1152/7050 train_time:255379ms step_avg:221.68ms step:1153/7050 train_time:255601ms step_avg:221.68ms step:1154/7050 train_time:255823ms step_avg:221.68ms step:1155/7050 train_time:256047ms step_avg:221.69ms step:1156/7050 train_time:256268ms step_avg:221.69ms step:1157/7050 train_time:256492ms step_avg:221.69ms step:1158/7050 train_time:256714ms step_avg:221.69ms step:1159/7050 train_time:256938ms step_avg:221.69ms step:1160/7050 train_time:257162ms step_avg:221.69ms step:1161/7050 train_time:257385ms step_avg:221.69ms step:1162/7050 train_time:257608ms step_avg:221.69ms step:1163/7050 train_time:257831ms step_avg:221.69ms step:1164/7050 train_time:258054ms step_avg:221.70ms step:1165/7050 train_time:258278ms step_avg:221.70ms step:1166/7050 train_time:258502ms step_avg:221.70ms step:1167/7050 train_time:258724ms step_avg:221.70ms step:1168/7050 train_time:258946ms step_avg:221.70ms step:1169/7050 
train_time:259169ms step_avg:221.70ms step:1170/7050 train_time:259393ms step_avg:221.70ms step:1171/7050 train_time:259616ms step_avg:221.70ms step:1172/7050 train_time:259840ms step_avg:221.71ms step:1173/7050 train_time:260065ms step_avg:221.71ms step:1174/7050 train_time:260287ms step_avg:221.71ms step:1175/7050 train_time:260510ms step_avg:221.71ms step:1176/7050 train_time:260733ms step_avg:221.71ms step:1177/7050 train_time:260956ms step_avg:221.71ms step:1178/7050 train_time:261179ms step_avg:221.71ms step:1179/7050 train_time:261402ms step_avg:221.72ms step:1180/7050 train_time:261625ms step_avg:221.72ms step:1181/7050 train_time:261847ms step_avg:221.72ms step:1182/7050 train_time:262070ms step_avg:221.72ms step:1183/7050 train_time:262292ms step_avg:221.72ms step:1184/7050 train_time:262516ms step_avg:221.72ms step:1185/7050 train_time:262740ms step_avg:221.72ms step:1186/7050 train_time:262963ms step_avg:221.72ms step:1187/7050 train_time:263186ms step_avg:221.72ms step:1188/7050 train_time:263411ms step_avg:221.73ms step:1189/7050 train_time:263633ms step_avg:221.73ms step:1190/7050 train_time:263856ms step_avg:221.73ms step:1191/7050 train_time:264080ms step_avg:221.73ms step:1192/7050 train_time:264303ms step_avg:221.73ms step:1193/7050 train_time:264527ms step_avg:221.73ms step:1194/7050 train_time:264749ms step_avg:221.73ms step:1195/7050 train_time:264973ms step_avg:221.73ms step:1196/7050 train_time:265195ms step_avg:221.73ms step:1197/7050 train_time:265420ms step_avg:221.74ms step:1198/7050 train_time:265644ms step_avg:221.74ms step:1199/7050 train_time:265866ms step_avg:221.74ms step:1200/7050 train_time:266090ms step_avg:221.74ms step:1201/7050 train_time:266314ms step_avg:221.74ms step:1202/7050 train_time:266538ms step_avg:221.75ms step:1203/7050 train_time:266763ms step_avg:221.75ms step:1204/7050 train_time:266984ms step_avg:221.75ms step:1205/7050 train_time:267208ms step_avg:221.75ms step:1206/7050 train_time:267432ms step_avg:221.75ms 
step:1207/7050 train_time:267655ms step_avg:221.75ms step:1208/7050 train_time:267878ms step_avg:221.75ms step:1209/7050 train_time:268101ms step_avg:221.75ms step:1210/7050 train_time:268324ms step_avg:221.76ms step:1211/7050 train_time:268548ms step_avg:221.76ms step:1212/7050 train_time:268771ms step_avg:221.76ms step:1213/7050 train_time:268994ms step_avg:221.76ms step:1214/7050 train_time:269216ms step_avg:221.76ms step:1215/7050 train_time:269441ms step_avg:221.76ms step:1216/7050 train_time:269665ms step_avg:221.76ms step:1217/7050 train_time:269888ms step_avg:221.77ms step:1218/7050 train_time:270110ms step_avg:221.77ms step:1219/7050 train_time:270333ms step_avg:221.77ms step:1220/7050 train_time:270556ms step_avg:221.77ms step:1221/7050 train_time:270780ms step_avg:221.77ms step:1222/7050 train_time:271002ms step_avg:221.77ms step:1223/7050 train_time:271225ms step_avg:221.77ms step:1224/7050 train_time:271449ms step_avg:221.77ms step:1225/7050 train_time:271672ms step_avg:221.77ms step:1226/7050 train_time:271896ms step_avg:221.77ms step:1227/7050 train_time:272119ms step_avg:221.78ms step:1228/7050 train_time:272342ms step_avg:221.78ms step:1229/7050 train_time:272564ms step_avg:221.78ms step:1230/7050 train_time:272788ms step_avg:221.78ms step:1231/7050 train_time:273012ms step_avg:221.78ms step:1232/7050 train_time:273236ms step_avg:221.78ms step:1233/7050 train_time:273460ms step_avg:221.78ms step:1234/7050 train_time:273682ms step_avg:221.78ms step:1235/7050 train_time:273905ms step_avg:221.79ms step:1236/7050 train_time:274127ms step_avg:221.79ms step:1237/7050 train_time:274350ms step_avg:221.79ms step:1238/7050 train_time:274574ms step_avg:221.79ms step:1239/7050 train_time:274798ms step_avg:221.79ms step:1240/7050 train_time:275021ms step_avg:221.79ms step:1241/7050 train_time:275244ms step_avg:221.79ms step:1242/7050 train_time:275467ms step_avg:221.79ms step:1243/7050 train_time:275690ms step_avg:221.79ms step:1244/7050 train_time:275913ms 
step_avg:221.79ms step:1245/7050 train_time:276135ms step_avg:221.80ms step:1246/7050 train_time:276358ms step_avg:221.80ms step:1247/7050 train_time:276581ms step_avg:221.80ms step:1248/7050 train_time:276803ms step_avg:221.80ms step:1249/7050 train_time:277026ms step_avg:221.80ms step:1250/7050 train_time:277250ms step_avg:221.80ms step:1250/7050 val_loss:3.3979 train_time:277427ms step_avg:221.94ms step:1251/7050 train_time:277474ms step_avg:221.80ms step:1252/7050 train_time:277696ms step_avg:221.80ms step:1253/7050 train_time:277929ms step_avg:221.81ms step:1254/7050 train_time:278152ms step_avg:221.81ms step:1255/7050 train_time:278374ms step_avg:221.81ms step:1256/7050 train_time:278596ms step_avg:221.81ms step:1257/7050 train_time:278821ms step_avg:221.81ms step:1258/7050 train_time:279047ms step_avg:221.82ms step:1259/7050 train_time:279268ms step_avg:221.82ms step:1260/7050 train_time:279491ms step_avg:221.82ms step:1261/7050 train_time:279714ms step_avg:221.82ms step:1262/7050 train_time:279939ms step_avg:221.82ms step:1263/7050 train_time:280163ms step_avg:221.82ms step:1264/7050 train_time:280384ms step_avg:221.82ms step:1265/7050 train_time:280607ms step_avg:221.82ms step:1266/7050 train_time:280830ms step_avg:221.82ms step:1267/7050 train_time:281054ms step_avg:221.83ms step:1268/7050 train_time:281277ms step_avg:221.83ms step:1269/7050 train_time:281500ms step_avg:221.83ms step:1270/7050 train_time:281722ms step_avg:221.83ms step:1271/7050 train_time:281944ms step_avg:221.83ms step:1272/7050 train_time:282168ms step_avg:221.83ms step:1273/7050 train_time:282392ms step_avg:221.83ms step:1274/7050 train_time:282614ms step_avg:221.83ms step:1275/7050 train_time:282837ms step_avg:221.83ms step:1276/7050 train_time:283060ms step_avg:221.83ms step:1277/7050 train_time:283284ms step_avg:221.84ms step:1278/7050 train_time:283505ms step_avg:221.83ms step:1279/7050 train_time:283726ms step_avg:221.83ms step:1280/7050 train_time:283949ms step_avg:221.84ms 
step:1281/7050 train_time:284172ms step_avg:221.84ms step:1282/7050 train_time:284397ms step_avg:221.84ms step:1283/7050 train_time:284620ms step_avg:221.84ms step:1284/7050 train_time:284843ms step_avg:221.84ms step:1285/7050 train_time:285065ms step_avg:221.84ms step:1286/7050 train_time:285288ms step_avg:221.84ms step:1287/7050 train_time:285511ms step_avg:221.84ms step:1288/7050 train_time:285733ms step_avg:221.84ms step:1289/7050 train_time:285957ms step_avg:221.84ms step:1290/7050 train_time:286183ms step_avg:221.85ms step:1291/7050 train_time:286404ms step_avg:221.85ms step:1292/7050 train_time:286626ms step_avg:221.85ms step:1293/7050 train_time:286849ms step_avg:221.85ms step:1294/7050 train_time:287072ms step_avg:221.85ms step:1295/7050 train_time:287296ms step_avg:221.85ms step:1296/7050 train_time:287519ms step_avg:221.85ms step:1297/7050 train_time:287743ms step_avg:221.85ms step:1298/7050 train_time:287965ms step_avg:221.85ms step:1299/7050 train_time:288188ms step_avg:221.85ms step:1300/7050 train_time:288412ms step_avg:221.86ms step:1301/7050 train_time:288637ms step_avg:221.86ms step:1302/7050 train_time:288859ms step_avg:221.86ms step:1303/7050 train_time:289083ms step_avg:221.86ms step:1304/7050 train_time:289307ms step_avg:221.86ms step:1305/7050 train_time:289530ms step_avg:221.86ms step:1306/7050 train_time:289754ms step_avg:221.86ms step:1307/7050 train_time:289975ms step_avg:221.86ms step:1308/7050 train_time:290199ms step_avg:221.86ms step:1309/7050 train_time:290422ms step_avg:221.87ms step:1310/7050 train_time:290646ms step_avg:221.87ms step:1311/7050 train_time:290869ms step_avg:221.87ms step:1312/7050 train_time:291096ms step_avg:221.87ms step:1313/7050 train_time:291316ms step_avg:221.87ms step:1314/7050 train_time:291541ms step_avg:221.87ms step:1315/7050 train_time:291765ms step_avg:221.87ms step:1316/7050 train_time:291987ms step_avg:221.87ms step:1317/7050 train_time:292209ms step_avg:221.88ms step:1318/7050 train_time:292432ms 
step_avg:221.88ms step:1319/7050 train_time:292656ms step_avg:221.88ms step:1320/7050 train_time:292879ms step_avg:221.88ms step:1321/7050 train_time:293102ms step_avg:221.88ms step:1322/7050 train_time:293327ms step_avg:221.88ms step:1323/7050 train_time:293548ms step_avg:221.88ms step:1324/7050 train_time:293770ms step_avg:221.88ms step:1325/7050 train_time:293994ms step_avg:221.88ms step:1326/7050 train_time:294216ms step_avg:221.88ms step:1327/7050 train_time:294441ms step_avg:221.88ms step:1328/7050 train_time:294664ms step_avg:221.89ms step:1329/7050 train_time:294887ms step_avg:221.89ms step:1330/7050 train_time:295111ms step_avg:221.89ms step:1331/7050 train_time:295333ms step_avg:221.89ms step:1332/7050 train_time:295556ms step_avg:221.89ms step:1333/7050 train_time:295780ms step_avg:221.89ms step:1334/7050 train_time:296004ms step_avg:221.89ms step:1335/7050 train_time:296227ms step_avg:221.89ms step:1336/7050 train_time:296450ms step_avg:221.89ms step:1337/7050 train_time:296674ms step_avg:221.90ms step:1338/7050 train_time:296898ms step_avg:221.90ms step:1339/7050 train_time:297121ms step_avg:221.90ms step:1340/7050 train_time:297345ms step_avg:221.90ms step:1341/7050 train_time:297569ms step_avg:221.90ms step:1342/7050 train_time:297793ms step_avg:221.90ms step:1343/7050 train_time:298016ms step_avg:221.90ms step:1344/7050 train_time:298240ms step_avg:221.90ms step:1345/7050 train_time:298463ms step_avg:221.91ms step:1346/7050 train_time:298687ms step_avg:221.91ms step:1347/7050 train_time:298911ms step_avg:221.91ms step:1348/7050 train_time:299134ms step_avg:221.91ms step:1349/7050 train_time:299357ms step_avg:221.91ms step:1350/7050 train_time:299580ms step_avg:221.91ms step:1351/7050 train_time:299807ms step_avg:221.92ms step:1352/7050 train_time:300031ms step_avg:221.92ms step:1353/7050 train_time:300253ms step_avg:221.92ms step:1354/7050 train_time:300475ms step_avg:221.92ms step:1355/7050 train_time:300700ms step_avg:221.92ms step:1356/7050 
train_time:300925ms step_avg:221.92ms step:1357/7050 train_time:301150ms step_avg:221.92ms step:1358/7050 train_time:301372ms step_avg:221.92ms step:1359/7050 train_time:301595ms step_avg:221.92ms step:1360/7050 train_time:301818ms step_avg:221.92ms step:1361/7050 train_time:302044ms step_avg:221.93ms step:1362/7050 train_time:302267ms step_avg:221.93ms step:1363/7050 train_time:302489ms step_avg:221.93ms step:1364/7050 train_time:302712ms step_avg:221.93ms step:1365/7050 train_time:302936ms step_avg:221.93ms step:1366/7050 train_time:303160ms step_avg:221.93ms step:1367/7050 train_time:303383ms step_avg:221.93ms step:1368/7050 train_time:303606ms step_avg:221.93ms step:1369/7050 train_time:303831ms step_avg:221.94ms step:1370/7050 train_time:304055ms step_avg:221.94ms step:1371/7050 train_time:304279ms step_avg:221.94ms step:1372/7050 train_time:304503ms step_avg:221.94ms step:1373/7050 train_time:304724ms step_avg:221.94ms step:1374/7050 train_time:304946ms step_avg:221.94ms step:1375/7050 train_time:305171ms step_avg:221.94ms step:1375/7050 val_loss:3.3756 train_time:305347ms step_avg:222.07ms step:1376/7050 train_time:305395ms step_avg:221.94ms step:1377/7050 train_time:305620ms step_avg:221.95ms step:1378/7050 train_time:305848ms step_avg:221.95ms step:1379/7050 train_time:306072ms step_avg:221.95ms step:1380/7050 train_time:306294ms step_avg:221.95ms step:1381/7050 train_time:306518ms step_avg:221.95ms step:1382/7050 train_time:306742ms step_avg:221.96ms step:1383/7050 train_time:306966ms step_avg:221.96ms step:1384/7050 train_time:307189ms step_avg:221.96ms step:1385/7050 train_time:307413ms step_avg:221.96ms step:1386/7050 train_time:307636ms step_avg:221.96ms step:1387/7050 train_time:307859ms step_avg:221.96ms step:1388/7050 train_time:308083ms step_avg:221.96ms step:1389/7050 train_time:308307ms step_avg:221.96ms step:1390/7050 train_time:308529ms step_avg:221.96ms step:1391/7050 train_time:308752ms step_avg:221.96ms step:1392/7050 train_time:308975ms 
step_avg:221.96ms step:1393/7050 train_time:309198ms step_avg:221.97ms step:1394/7050 train_time:309421ms step_avg:221.97ms step:1395/7050 train_time:309645ms step_avg:221.97ms step:1396/7050 train_time:309868ms step_avg:221.97ms step:1397/7050 train_time:310091ms step_avg:221.97ms step:1398/7050 train_time:310315ms step_avg:221.97ms step:1399/7050 train_time:310539ms step_avg:221.97ms step:1400/7050 train_time:310762ms step_avg:221.97ms step:1401/7050 train_time:310985ms step_avg:221.97ms step:1402/7050 train_time:311208ms step_avg:221.97ms step:1403/7050 train_time:311431ms step_avg:221.98ms step:1404/7050 train_time:311657ms step_avg:221.98ms step:1405/7050 train_time:311878ms step_avg:221.98ms step:1406/7050 train_time:312102ms step_avg:221.98ms step:1407/7050 train_time:312326ms step_avg:221.98ms step:1408/7050 train_time:312548ms step_avg:221.98ms step:1409/7050 train_time:312772ms step_avg:221.98ms step:1410/7050 train_time:312994ms step_avg:221.98ms step:1411/7050 train_time:313218ms step_avg:221.98ms step:1412/7050 train_time:313441ms step_avg:221.98ms step:1413/7050 train_time:313665ms step_avg:221.98ms step:1414/7050 train_time:313889ms step_avg:221.99ms step:1415/7050 train_time:314110ms step_avg:221.99ms step:1416/7050 train_time:314334ms step_avg:221.99ms step:1417/7050 train_time:314557ms step_avg:221.99ms step:1418/7050 train_time:314780ms step_avg:221.99ms step:1419/7050 train_time:315004ms step_avg:221.99ms step:1420/7050 train_time:315228ms step_avg:221.99ms step:1421/7050 train_time:315451ms step_avg:221.99ms step:1422/7050 train_time:315673ms step_avg:221.99ms step:1423/7050 train_time:315896ms step_avg:221.99ms step:1424/7050 train_time:316119ms step_avg:221.99ms step:1425/7050 train_time:316343ms step_avg:222.00ms step:1426/7050 train_time:316566ms step_avg:222.00ms step:1427/7050 train_time:316788ms step_avg:222.00ms step:1428/7050 train_time:317014ms step_avg:222.00ms step:1429/7050 train_time:317238ms step_avg:222.00ms step:1430/7050 
train_time:317460ms step_avg:222.00ms step:1431/7050 train_time:317683ms step_avg:222.00ms step:1432/7050 train_time:317905ms step_avg:222.00ms step:1433/7050 train_time:318130ms step_avg:222.00ms step:1434/7050 train_time:318353ms step_avg:222.00ms step:1435/7050 train_time:318574ms step_avg:222.00ms step:1436/7050 train_time:318797ms step_avg:222.00ms step:1437/7050 train_time:319020ms step_avg:222.00ms step:1438/7050 train_time:319245ms step_avg:222.01ms step:1439/7050 train_time:319468ms step_avg:222.01ms step:1440/7050 train_time:319690ms step_avg:222.01ms step:1441/7050 train_time:319914ms step_avg:222.01ms step:1442/7050 train_time:320138ms step_avg:222.01ms step:1443/7050 train_time:320360ms step_avg:222.01ms step:1444/7050 train_time:320585ms step_avg:222.01ms step:1445/7050 train_time:320808ms step_avg:222.01ms step:1446/7050 train_time:321030ms step_avg:222.01ms step:1447/7050 train_time:321253ms step_avg:222.01ms step:1448/7050 train_time:321477ms step_avg:222.01ms step:1449/7050 train_time:321700ms step_avg:222.02ms step:1450/7050 train_time:321925ms step_avg:222.02ms step:1451/7050 train_time:322150ms step_avg:222.02ms step:1452/7050 train_time:322370ms step_avg:222.02ms step:1453/7050 train_time:322595ms step_avg:222.02ms step:1454/7050 train_time:322817ms step_avg:222.02ms step:1455/7050 train_time:323040ms step_avg:222.02ms step:1456/7050 train_time:323264ms step_avg:222.02ms step:1457/7050 train_time:323486ms step_avg:222.02ms step:1458/7050 train_time:323709ms step_avg:222.02ms step:1459/7050 train_time:323931ms step_avg:222.02ms step:1460/7050 train_time:324155ms step_avg:222.02ms step:1461/7050 train_time:324378ms step_avg:222.02ms step:1462/7050 train_time:324602ms step_avg:222.03ms step:1463/7050 train_time:324825ms step_avg:222.03ms step:1464/7050 train_time:325048ms step_avg:222.03ms step:1465/7050 train_time:325271ms step_avg:222.03ms step:1466/7050 train_time:325493ms step_avg:222.03ms step:1467/7050 train_time:325717ms step_avg:222.03ms 
step:1468/7050 train_time:325941ms step_avg:222.03ms step:1469/7050 train_time:326165ms step_avg:222.03ms step:1470/7050 train_time:326390ms step_avg:222.03ms step:1471/7050 train_time:326613ms step_avg:222.03ms step:1472/7050 train_time:326836ms step_avg:222.04ms step:1473/7050 train_time:327060ms step_avg:222.04ms step:1474/7050 train_time:327283ms step_avg:222.04ms step:1475/7050 train_time:327507ms step_avg:222.04ms step:1476/7050 train_time:327730ms step_avg:222.04ms step:1477/7050 train_time:327953ms step_avg:222.04ms step:1478/7050 train_time:328175ms step_avg:222.04ms step:1479/7050 train_time:328399ms step_avg:222.04ms step:1480/7050 train_time:328622ms step_avg:222.04ms step:1481/7050 train_time:328846ms step_avg:222.04ms step:1482/7050 train_time:329068ms step_avg:222.04ms step:1483/7050 train_time:329291ms step_avg:222.04ms step:1484/7050 train_time:329514ms step_avg:222.04ms step:1485/7050 train_time:329738ms step_avg:222.05ms step:1486/7050 train_time:329960ms step_avg:222.05ms step:1487/7050 train_time:330183ms step_avg:222.05ms step:1488/7050 train_time:330407ms step_avg:222.05ms step:1489/7050 train_time:330630ms step_avg:222.05ms step:1490/7050 train_time:330854ms step_avg:222.05ms step:1491/7050 train_time:331076ms step_avg:222.05ms step:1492/7050 train_time:331300ms step_avg:222.05ms step:1493/7050 train_time:331522ms step_avg:222.05ms step:1494/7050 train_time:331746ms step_avg:222.05ms step:1495/7050 train_time:331968ms step_avg:222.05ms step:1496/7050 train_time:332191ms step_avg:222.05ms step:1497/7050 train_time:332413ms step_avg:222.05ms step:1498/7050 train_time:332637ms step_avg:222.05ms step:1499/7050 train_time:332861ms step_avg:222.06ms step:1500/7050 train_time:333084ms step_avg:222.06ms step:1500/7050 val_loss:3.3521 train_time:333260ms step_avg:222.17ms step:1501/7050 train_time:333311ms step_avg:222.06ms step:1502/7050 train_time:333531ms step_avg:222.06ms step:1503/7050 train_time:333758ms step_avg:222.06ms step:1504/7050 
train_time:333983ms step_avg:222.06ms step:1505/7050 train_time:334205ms step_avg:222.06ms step:1506/7050 train_time:334427ms step_avg:222.06ms step:1507/7050 train_time:334650ms step_avg:222.06ms step:1508/7050 train_time:334875ms step_avg:222.07ms step:1509/7050 train_time:335099ms step_avg:222.07ms step:1510/7050 train_time:335321ms step_avg:222.07ms step:1511/7050 train_time:335543ms step_avg:222.07ms step:1512/7050 train_time:335767ms step_avg:222.07ms step:1513/7050 train_time:335992ms step_avg:222.07ms step:1514/7050 train_time:336213ms step_avg:222.07ms step:1515/7050 train_time:336436ms step_avg:222.07ms step:1516/7050 train_time:336660ms step_avg:222.07ms step:1517/7050 train_time:336884ms step_avg:222.07ms step:1518/7050 train_time:337107ms step_avg:222.07ms step:1519/7050 train_time:337330ms step_avg:222.07ms step:1520/7050 train_time:337553ms step_avg:222.07ms step:1521/7050 train_time:337776ms step_avg:222.07ms step:1522/7050 train_time:338001ms step_avg:222.08ms step:1523/7050 train_time:338223ms step_avg:222.08ms step:1524/7050 train_time:338445ms step_avg:222.08ms step:1525/7050 train_time:338668ms step_avg:222.08ms step:1526/7050 train_time:338893ms step_avg:222.08ms step:1527/7050 train_time:339117ms step_avg:222.08ms step:1528/7050 train_time:339340ms step_avg:222.08ms step:1529/7050 train_time:339562ms step_avg:222.08ms step:1530/7050 train_time:339787ms step_avg:222.08ms step:1531/7050 train_time:340010ms step_avg:222.08ms step:1532/7050 train_time:340234ms step_avg:222.08ms step:1533/7050 train_time:340457ms step_avg:222.09ms step:1534/7050 train_time:340680ms step_avg:222.09ms step:1535/7050 train_time:340904ms step_avg:222.09ms step:1536/7050 train_time:341127ms step_avg:222.09ms step:1537/7050 train_time:341350ms step_avg:222.09ms step:1538/7050 train_time:341574ms step_avg:222.09ms step:1539/7050 train_time:341797ms step_avg:222.09ms step:1540/7050 train_time:342022ms step_avg:222.09ms step:1541/7050 train_time:342244ms step_avg:222.09ms 
step:1542/7050 train_time:342466ms step_avg:222.09ms step:1543/7050 train_time:342690ms step_avg:222.09ms step:1544/7050 train_time:342913ms step_avg:222.09ms step:1545/7050 train_time:343137ms step_avg:222.10ms step:1546/7050 train_time:343360ms step_avg:222.10ms step:1547/7050 train_time:343584ms step_avg:222.10ms step:1548/7050 train_time:343809ms step_avg:222.10ms step:1549/7050 train_time:344032ms step_avg:222.10ms step:1550/7050 train_time:344254ms step_avg:222.10ms step:1551/7050 train_time:344478ms step_avg:222.10ms step:1552/7050 train_time:344700ms step_avg:222.10ms step:1553/7050 train_time:344922ms step_avg:222.10ms step:1554/7050 train_time:345145ms step_avg:222.10ms step:1555/7050 train_time:345369ms step_avg:222.10ms step:1556/7050 train_time:345592ms step_avg:222.10ms step:1557/7050 train_time:345814ms step_avg:222.10ms step:1558/7050 train_time:346038ms step_avg:222.10ms step:1559/7050 train_time:346261ms step_avg:222.10ms step:1560/7050 train_time:346484ms step_avg:222.11ms step:1561/7050 train_time:346706ms step_avg:222.10ms step:1562/7050 train_time:346929ms step_avg:222.11ms step:1563/7050 train_time:347152ms step_avg:222.11ms step:1564/7050 train_time:347376ms step_avg:222.11ms step:1565/7050 train_time:347599ms step_avg:222.11ms step:1566/7050 train_time:347823ms step_avg:222.11ms step:1567/7050 train_time:348046ms step_avg:222.11ms step:1568/7050 train_time:348272ms step_avg:222.11ms step:1569/7050 train_time:348502ms step_avg:222.12ms step:1570/7050 train_time:348729ms step_avg:222.12ms step:1571/7050 train_time:348956ms step_avg:222.12ms step:1572/7050 train_time:349186ms step_avg:222.13ms step:1573/7050 train_time:349414ms step_avg:222.13ms step:1574/7050 train_time:349644ms step_avg:222.14ms step:1575/7050 train_time:349872ms step_avg:222.14ms step:1576/7050 train_time:350099ms step_avg:222.14ms step:1577/7050 train_time:350328ms step_avg:222.15ms step:1578/7050 train_time:350556ms step_avg:222.15ms step:1579/7050 train_time:350785ms 
step_avg:222.16ms step:1580/7050 train_time:351013ms step_avg:222.16ms step:1581/7050 train_time:351241ms step_avg:222.16ms step:1582/7050 train_time:351471ms step_avg:222.17ms step:1583/7050 train_time:351699ms step_avg:222.17ms step:1584/7050 train_time:351925ms step_avg:222.18ms step:1585/7050 train_time:352153ms step_avg:222.18ms step:1586/7050 train_time:352381ms step_avg:222.18ms step:1587/7050 train_time:352608ms step_avg:222.19ms step:1588/7050 train_time:352837ms step_avg:222.19ms step:1589/7050 train_time:353066ms step_avg:222.19ms step:1590/7050 train_time:353294ms step_avg:222.20ms step:1591/7050 train_time:353522ms step_avg:222.20ms step:1592/7050 train_time:353750ms step_avg:222.20ms step:1593/7050 train_time:353978ms step_avg:222.21ms step:1594/7050 train_time:354207ms step_avg:222.21ms step:1595/7050 train_time:354434ms step_avg:222.22ms step:1596/7050 train_time:354663ms step_avg:222.22ms step:1597/7050 train_time:354892ms step_avg:222.22ms step:1598/7050 train_time:355120ms step_avg:222.23ms step:1599/7050 train_time:355348ms step_avg:222.23ms step:1600/7050 train_time:355576ms step_avg:222.23ms step:1601/7050 train_time:355804ms step_avg:222.24ms step:1602/7050 train_time:356031ms step_avg:222.24ms step:1603/7050 train_time:356260ms step_avg:222.25ms step:1604/7050 train_time:356490ms step_avg:222.25ms step:1605/7050 train_time:356717ms step_avg:222.25ms step:1606/7050 train_time:356944ms step_avg:222.26ms step:1607/7050 train_time:357170ms step_avg:222.26ms step:1608/7050 train_time:357398ms step_avg:222.26ms step:1609/7050 train_time:357626ms step_avg:222.27ms step:1610/7050 train_time:357855ms step_avg:222.27ms step:1611/7050 train_time:358082ms step_avg:222.27ms step:1612/7050 train_time:358309ms step_avg:222.28ms step:1613/7050 train_time:358538ms step_avg:222.28ms step:1614/7050 train_time:358768ms step_avg:222.28ms step:1615/7050 train_time:358995ms step_avg:222.29ms step:1616/7050 train_time:359223ms step_avg:222.29ms step:1617/7050 
train_time:359451ms step_avg:222.29ms step:1618/7050 train_time:359680ms step_avg:222.30ms step:1619/7050 train_time:359908ms step_avg:222.30ms step:1620/7050 train_time:360135ms step_avg:222.31ms step:1621/7050 train_time:360362ms step_avg:222.31ms step:1622/7050 train_time:360590ms step_avg:222.31ms step:1623/7050 train_time:360820ms step_avg:222.32ms step:1624/7050 train_time:361047ms step_avg:222.32ms step:1625/7050 train_time:361276ms step_avg:222.32ms step:1625/7050 val_loss:3.3065 train_time:361455ms step_avg:222.43ms step:1626/7050 train_time:361504ms step_avg:222.33ms step:1627/7050 train_time:361731ms step_avg:222.33ms step:1628/7050 train_time:361962ms step_avg:222.34ms step:1629/7050 train_time:362192ms step_avg:222.34ms step:1630/7050 train_time:362419ms step_avg:222.34ms step:1631/7050 train_time:362646ms step_avg:222.35ms step:1632/7050 train_time:362875ms step_avg:222.35ms step:1633/7050 train_time:363106ms step_avg:222.36ms step:1634/7050 train_time:363335ms step_avg:222.36ms step:1635/7050 train_time:363561ms step_avg:222.36ms step:1636/7050 train_time:363789ms step_avg:222.37ms step:1637/7050 train_time:364018ms step_avg:222.37ms step:1638/7050 train_time:364247ms step_avg:222.37ms step:1639/7050 train_time:364474ms step_avg:222.38ms step:1640/7050 train_time:364703ms step_avg:222.38ms step:1641/7050 train_time:364932ms step_avg:222.38ms step:1642/7050 train_time:365159ms step_avg:222.39ms step:1643/7050 train_time:365386ms step_avg:222.39ms step:1644/7050 train_time:365615ms step_avg:222.39ms step:1645/7050 train_time:365841ms step_avg:222.40ms step:1646/7050 train_time:366070ms step_avg:222.40ms step:1647/7050 train_time:366299ms step_avg:222.40ms step:1648/7050 train_time:366527ms step_avg:222.41ms step:1649/7050 train_time:366754ms step_avg:222.41ms step:1650/7050 train_time:366983ms step_avg:222.41ms step:1651/7050 train_time:367212ms step_avg:222.42ms step:1652/7050 train_time:367440ms step_avg:222.42ms step:1653/7050 train_time:367668ms 
step_avg:222.42ms step:1654/7050 train_time:367896ms step_avg:222.43ms step:1655/7050 train_time:368125ms step_avg:222.43ms step:1656/7050 train_time:368353ms step_avg:222.44ms step:1657/7050 train_time:368581ms step_avg:222.44ms step:1658/7050 train_time:368810ms step_avg:222.44ms step:1659/7050 train_time:369038ms step_avg:222.45ms step:1660/7050 train_time:369265ms step_avg:222.45ms step:1661/7050 train_time:369494ms step_avg:222.45ms step:1662/7050 train_time:369722ms step_avg:222.46ms step:1663/7050 train_time:369951ms step_avg:222.46ms step:1664/7050 train_time:370178ms step_avg:222.46ms step:1665/7050 train_time:370406ms step_avg:222.47ms step:1666/7050 train_time:370635ms step_avg:222.47ms step:1667/7050 train_time:370862ms step_avg:222.47ms step:1668/7050 train_time:371090ms step_avg:222.48ms step:1669/7050 train_time:371320ms step_avg:222.48ms step:1670/7050 train_time:371547ms step_avg:222.48ms step:1671/7050 train_time:371775ms step_avg:222.49ms step:1672/7050 train_time:372005ms step_avg:222.49ms step:1673/7050 train_time:372232ms step_avg:222.49ms step:1674/7050 train_time:372460ms step_avg:222.50ms step:1675/7050 train_time:372688ms step_avg:222.50ms step:1676/7050 train_time:372917ms step_avg:222.50ms step:1677/7050 train_time:373143ms step_avg:222.51ms step:1678/7050 train_time:373370ms step_avg:222.51ms step:1679/7050 train_time:373599ms step_avg:222.51ms step:1680/7050 train_time:373826ms step_avg:222.52ms step:1681/7050 train_time:374055ms step_avg:222.52ms step:1682/7050 train_time:374284ms step_avg:222.52ms step:1683/7050 train_time:374512ms step_avg:222.53ms step:1684/7050 train_time:374739ms step_avg:222.53ms step:1685/7050 train_time:374966ms step_avg:222.53ms step:1686/7050 train_time:375196ms step_avg:222.54ms step:1687/7050 train_time:375424ms step_avg:222.54ms step:1688/7050 train_time:375651ms step_avg:222.54ms step:1689/7050 train_time:375880ms step_avg:222.55ms step:1690/7050 train_time:376109ms step_avg:222.55ms step:1691/7050 
train_time:376337ms step_avg:222.55ms step:1692/7050 train_time:376564ms step_avg:222.56ms step:1693/7050 train_time:376793ms step_avg:222.56ms step:1694/7050 train_time:377021ms step_avg:222.56ms step:1695/7050 train_time:377249ms step_avg:222.57ms step:1696/7050 train_time:377476ms step_avg:222.57ms step:1697/7050 train_time:377705ms step_avg:222.57ms step:1698/7050 train_time:377934ms step_avg:222.58ms step:1699/7050 train_time:378161ms step_avg:222.58ms step:1700/7050 train_time:378389ms step_avg:222.58ms step:1701/7050 train_time:378618ms step_avg:222.59ms step:1702/7050 train_time:378847ms step_avg:222.59ms step:1703/7050 train_time:379074ms step_avg:222.59ms step:1704/7050 train_time:379303ms step_avg:222.60ms step:1705/7050 train_time:379530ms step_avg:222.60ms step:1706/7050 train_time:379757ms step_avg:222.60ms step:1707/7050 train_time:379985ms step_avg:222.60ms step:1708/7050 train_time:380213ms step_avg:222.61ms step:1709/7050 train_time:380441ms step_avg:222.61ms step:1710/7050 train_time:380667ms step_avg:222.61ms step:1711/7050 train_time:380896ms step_avg:222.62ms step:1712/7050 train_time:381124ms step_avg:222.62ms step:1713/7050 train_time:381352ms step_avg:222.62ms step:1714/7050 train_time:381579ms step_avg:222.62ms step:1715/7050 train_time:381808ms step_avg:222.63ms step:1716/7050 train_time:382036ms step_avg:222.63ms step:1717/7050 train_time:382265ms step_avg:222.64ms step:1718/7050 train_time:382493ms step_avg:222.64ms step:1719/7050 train_time:382722ms step_avg:222.64ms step:1720/7050 train_time:382951ms step_avg:222.65ms step:1721/7050 train_time:383180ms step_avg:222.65ms step:1722/7050 train_time:383409ms step_avg:222.65ms step:1723/7050 train_time:383636ms step_avg:222.66ms step:1724/7050 train_time:383866ms step_avg:222.66ms step:1725/7050 train_time:384095ms step_avg:222.66ms step:1726/7050 train_time:384323ms step_avg:222.67ms step:1727/7050 train_time:384552ms step_avg:222.67ms step:1728/7050 train_time:384779ms step_avg:222.67ms 
step:1729/7050 train_time:385007ms step_avg:222.68ms step:1730/7050 train_time:385233ms step_avg:222.68ms step:1731/7050 train_time:385460ms step_avg:222.68ms step:1732/7050 train_time:385688ms step_avg:222.68ms step:1733/7050 train_time:385917ms step_avg:222.69ms step:1734/7050 train_time:386145ms step_avg:222.69ms step:1735/7050 train_time:386372ms step_avg:222.69ms step:1736/7050 train_time:386601ms step_avg:222.70ms step:1737/7050 train_time:386827ms step_avg:222.70ms step:1738/7050 train_time:387054ms step_avg:222.70ms step:1739/7050 train_time:387283ms step_avg:222.70ms step:1740/7050 train_time:387512ms step_avg:222.71ms step:1741/7050 train_time:387740ms step_avg:222.71ms step:1742/7050 train_time:387968ms step_avg:222.71ms step:1743/7050 train_time:388198ms step_avg:222.72ms step:1744/7050 train_time:388425ms step_avg:222.72ms step:1745/7050 train_time:388652ms step_avg:222.72ms step:1746/7050 train_time:388882ms step_avg:222.73ms step:1747/7050 train_time:389111ms step_avg:222.73ms step:1748/7050 train_time:389339ms step_avg:222.73ms step:1749/7050 train_time:389567ms step_avg:222.74ms step:1750/7050 train_time:389795ms step_avg:222.74ms step:1750/7050 val_loss:3.2853 train_time:389975ms step_avg:222.84ms step:1751/7050 train_time:390024ms step_avg:222.74ms step:1752/7050 train_time:390249ms step_avg:222.75ms step:1753/7050 train_time:390480ms step_avg:222.75ms step:1754/7050 train_time:390710ms step_avg:222.75ms step:1755/7050 train_time:390939ms step_avg:222.76ms step:1756/7050 train_time:391165ms step_avg:222.76ms step:1757/7050 train_time:391394ms step_avg:222.76ms step:1758/7050 train_time:391624ms step_avg:222.77ms step:1759/7050 train_time:391851ms step_avg:222.77ms step:1760/7050 train_time:392078ms step_avg:222.77ms step:1761/7050 train_time:392306ms step_avg:222.77ms step:1762/7050 train_time:392536ms step_avg:222.78ms step:1763/7050 train_time:392764ms step_avg:222.78ms step:1764/7050 train_time:392992ms step_avg:222.78ms step:1765/7050 
train_time:393220ms step_avg:222.79ms step:1766/7050 train_time:393448ms step_avg:222.79ms step:1767/7050 train_time:393677ms step_avg:222.79ms step:1768/7050 train_time:393904ms step_avg:222.80ms step:1769/7050 train_time:394132ms step_avg:222.80ms step:1770/7050 train_time:394361ms step_avg:222.80ms step:1771/7050 train_time:394589ms step_avg:222.81ms step:1772/7050 train_time:394817ms step_avg:222.81ms step:1773/7050 train_time:395044ms step_avg:222.81ms step:1774/7050 train_time:395271ms step_avg:222.81ms step:1775/7050 train_time:395499ms step_avg:222.82ms step:1776/7050 train_time:395729ms step_avg:222.82ms step:1777/7050 train_time:395957ms step_avg:222.82ms step:1778/7050 train_time:396186ms step_avg:222.83ms step:1779/7050 train_time:396414ms step_avg:222.83ms step:1780/7050 train_time:396642ms step_avg:222.83ms step:1781/7050 train_time:396869ms step_avg:222.84ms step:1782/7050 train_time:397098ms step_avg:222.84ms step:1783/7050 train_time:397326ms step_avg:222.84ms step:1784/7050 train_time:397554ms step_avg:222.84ms step:1785/7050 train_time:397782ms step_avg:222.85ms step:1786/7050 train_time:398009ms step_avg:222.85ms step:1787/7050 train_time:398238ms step_avg:222.85ms step:1788/7050 train_time:398466ms step_avg:222.86ms step:1789/7050 train_time:398694ms step_avg:222.86ms step:1790/7050 train_time:398922ms step_avg:222.86ms step:1791/7050 train_time:399150ms step_avg:222.86ms step:1792/7050 train_time:399377ms step_avg:222.87ms step:1793/7050 train_time:399605ms step_avg:222.87ms step:1794/7050 train_time:399834ms step_avg:222.87ms step:1795/7050 train_time:400062ms step_avg:222.88ms step:1796/7050 train_time:400290ms step_avg:222.88ms step:1797/7050 train_time:400517ms step_avg:222.88ms step:1798/7050 train_time:400746ms step_avg:222.88ms step:1799/7050 train_time:400973ms step_avg:222.89ms step:1800/7050 train_time:401202ms step_avg:222.89ms step:1801/7050 train_time:401429ms step_avg:222.89ms step:1802/7050 train_time:401656ms step_avg:222.89ms 
step:1803/7050 train_time:401883ms step_avg:222.90ms step:1804/7050 train_time:402111ms step_avg:222.90ms step:1805/7050 train_time:402340ms step_avg:222.90ms step:1806/7050 train_time:402568ms step_avg:222.91ms step:1807/7050 train_time:402797ms step_avg:222.91ms step:1808/7050 train_time:403024ms step_avg:222.91ms step:1809/7050 train_time:403253ms step_avg:222.91ms step:1810/7050 train_time:403480ms step_avg:222.92ms step:1811/7050 train_time:403709ms step_avg:222.92ms step:1812/7050 train_time:403938ms step_avg:222.92ms step:1813/7050 train_time:404166ms step_avg:222.93ms step:1814/7050 train_time:404394ms step_avg:222.93ms step:1815/7050 train_time:404623ms step_avg:222.93ms step:1816/7050 train_time:404851ms step_avg:222.94ms step:1817/7050 train_time:405080ms step_avg:222.94ms step:1818/7050 train_time:405309ms step_avg:222.94ms step:1819/7050 train_time:405538ms step_avg:222.95ms step:1820/7050 train_time:405765ms step_avg:222.95ms step:1821/7050 train_time:405992ms step_avg:222.95ms step:1822/7050 train_time:406220ms step_avg:222.95ms step:1823/7050 train_time:406448ms step_avg:222.96ms step:1824/7050 train_time:406677ms step_avg:222.96ms step:1825/7050 train_time:406904ms step_avg:222.96ms step:1826/7050 train_time:407132ms step_avg:222.96ms step:1827/7050 train_time:407360ms step_avg:222.97ms step:1828/7050 train_time:407588ms step_avg:222.97ms step:1829/7050 train_time:407817ms step_avg:222.97ms step:1830/7050 train_time:408044ms step_avg:222.98ms step:1831/7050 train_time:408272ms step_avg:222.98ms step:1832/7050 train_time:408501ms step_avg:222.98ms step:1833/7050 train_time:408728ms step_avg:222.98ms step:1834/7050 train_time:408957ms step_avg:222.99ms step:1835/7050 train_time:409183ms step_avg:222.99ms step:1836/7050 train_time:409413ms step_avg:222.99ms step:1837/7050 train_time:409643ms step_avg:223.00ms step:1838/7050 train_time:409871ms step_avg:223.00ms step:1839/7050 train_time:410098ms step_avg:223.00ms step:1840/7050 train_time:410325ms 
step_avg:223.00ms step:1841/7050 train_time:410554ms step_avg:223.01ms step:1842/7050 train_time:410782ms step_avg:223.01ms step:1843/7050 train_time:411008ms step_avg:223.01ms step:1844/7050 train_time:411238ms step_avg:223.01ms step:1845/7050 train_time:411464ms step_avg:223.02ms step:1846/7050 train_time:411692ms step_avg:223.02ms step:1847/7050 train_time:411920ms step_avg:223.02ms step:1848/7050 train_time:412149ms step_avg:223.02ms step:1849/7050 train_time:412377ms step_avg:223.03ms step:1850/7050 train_time:412605ms step_avg:223.03ms step:1851/7050 train_time:412835ms step_avg:223.03ms step:1852/7050 train_time:413062ms step_avg:223.04ms step:1853/7050 train_time:413290ms step_avg:223.04ms step:1854/7050 train_time:413518ms step_avg:223.04ms step:1855/7050 train_time:413746ms step_avg:223.04ms step:1856/7050 train_time:413974ms step_avg:223.05ms step:1857/7050 train_time:414202ms step_avg:223.05ms step:1858/7050 train_time:414430ms step_avg:223.05ms step:1859/7050 train_time:414659ms step_avg:223.05ms step:1860/7050 train_time:414886ms step_avg:223.06ms step:1861/7050 train_time:415113ms step_avg:223.06ms step:1862/7050 train_time:415341ms step_avg:223.06ms step:1863/7050 train_time:415568ms step_avg:223.06ms step:1864/7050 train_time:415796ms step_avg:223.07ms step:1865/7050 train_time:416025ms step_avg:223.07ms step:1866/7050 train_time:416252ms step_avg:223.07ms step:1867/7050 train_time:416481ms step_avg:223.07ms step:1868/7050 train_time:416709ms step_avg:223.08ms step:1869/7050 train_time:416937ms step_avg:223.08ms step:1870/7050 train_time:417164ms step_avg:223.08ms step:1871/7050 train_time:417392ms step_avg:223.08ms step:1872/7050 train_time:417621ms step_avg:223.09ms step:1873/7050 train_time:417850ms step_avg:223.09ms step:1874/7050 train_time:418078ms step_avg:223.09ms step:1875/7050 train_time:418305ms step_avg:223.10ms step:1875/7050 val_loss:3.2693 train_time:418484ms step_avg:223.19ms step:1876/7050 train_time:418533ms step_avg:223.10ms 
step:1877/7050 train_time:418760ms step_avg:223.10ms step:1878/7050 train_time:418991ms step_avg:223.11ms step:1879/7050 train_time:419219ms step_avg:223.11ms step:1880/7050 train_time:419446ms step_avg:223.11ms step:1881/7050 train_time:419672ms step_avg:223.11ms step:1882/7050 train_time:419902ms step_avg:223.11ms step:1883/7050 train_time:420131ms step_avg:223.12ms step:1884/7050 train_time:420360ms step_avg:223.12ms step:1885/7050 train_time:420587ms step_avg:223.12ms step:1886/7050 train_time:420813ms step_avg:223.12ms step:1887/7050 train_time:421042ms step_avg:223.13ms step:1888/7050 train_time:421269ms step_avg:223.13ms step:1889/7050 train_time:421497ms step_avg:223.13ms step:1890/7050 train_time:421726ms step_avg:223.14ms step:1891/7050 train_time:421954ms step_avg:223.14ms step:1892/7050 train_time:422184ms step_avg:223.14ms step:1893/7050 train_time:422410ms step_avg:223.14ms step:1894/7050 train_time:422638ms step_avg:223.15ms step:1895/7050 train_time:422866ms step_avg:223.15ms step:1896/7050 train_time:423096ms step_avg:223.15ms step:1897/7050 train_time:423323ms step_avg:223.15ms step:1898/7050 train_time:423552ms step_avg:223.16ms step:1899/7050 train_time:423780ms step_avg:223.16ms step:1900/7050 train_time:424011ms step_avg:223.16ms step:1901/7050 train_time:424239ms step_avg:223.17ms step:1902/7050 train_time:424466ms step_avg:223.17ms step:1903/7050 train_time:424694ms step_avg:223.17ms step:1904/7050 train_time:424920ms step_avg:223.17ms step:1905/7050 train_time:425149ms step_avg:223.18ms step:1906/7050 train_time:425377ms step_avg:223.18ms step:1907/7050 train_time:425604ms step_avg:223.18ms step:1908/7050 train_time:425832ms step_avg:223.18ms step:1909/7050 train_time:426059ms step_avg:223.18ms step:1910/7050 train_time:426287ms step_avg:223.19ms step:1911/7050 train_time:426514ms step_avg:223.19ms step:1912/7050 train_time:426743ms step_avg:223.19ms step:1913/7050 train_time:426970ms step_avg:223.19ms step:1914/7050 train_time:427198ms 
step_avg:223.20ms step:1915/7050 train_time:427427ms step_avg:223.20ms step:1916/7050 train_time:427655ms step_avg:223.20ms step:1917/7050 train_time:427883ms step_avg:223.20ms step:1918/7050 train_time:428110ms step_avg:223.21ms step:1919/7050 train_time:428338ms step_avg:223.21ms step:1920/7050 train_time:428566ms step_avg:223.21ms step:1921/7050 train_time:428795ms step_avg:223.21ms step:1922/7050 train_time:429022ms step_avg:223.22ms step:1923/7050 train_time:429250ms step_avg:223.22ms step:1924/7050 train_time:429477ms step_avg:223.22ms step:1925/7050 train_time:429707ms step_avg:223.22ms step:1926/7050 train_time:429935ms step_avg:223.23ms step:1927/7050 train_time:430162ms step_avg:223.23ms step:1928/7050 train_time:430390ms step_avg:223.23ms step:1929/7050 train_time:430618ms step_avg:223.23ms step:1930/7050 train_time:430849ms step_avg:223.24ms step:1931/7050 train_time:431076ms step_avg:223.24ms step:1932/7050 train_time:431303ms step_avg:223.24ms step:1933/7050 train_time:431530ms step_avg:223.24ms step:1934/7050 train_time:431757ms step_avg:223.25ms step:1935/7050 train_time:431984ms step_avg:223.25ms step:1936/7050 train_time:432213ms step_avg:223.25ms step:1937/7050 train_time:432442ms step_avg:223.25ms step:1938/7050 train_time:432671ms step_avg:223.26ms step:1939/7050 train_time:432900ms step_avg:223.26ms step:1940/7050 train_time:433126ms step_avg:223.26ms step:1941/7050 train_time:433355ms step_avg:223.26ms step:1942/7050 train_time:433582ms step_avg:223.27ms step:1943/7050 train_time:433811ms step_avg:223.27ms step:1944/7050 train_time:434038ms step_avg:223.27ms step:1945/7050 train_time:434265ms step_avg:223.27ms step:1946/7050 train_time:434494ms step_avg:223.28ms step:1947/7050 train_time:434722ms step_avg:223.28ms step:1948/7050 train_time:434950ms step_avg:223.28ms step:1949/7050 train_time:435178ms step_avg:223.28ms step:1950/7050 train_time:435405ms step_avg:223.28ms step:1951/7050 train_time:435633ms step_avg:223.29ms step:1952/7050 
train_time:435860ms step_avg:223.29ms step:1953/7050 train_time:436089ms step_avg:223.29ms step:1954/7050 train_time:436317ms step_avg:223.29ms step:1955/7050 train_time:436545ms step_avg:223.30ms step:1956/7050 train_time:436773ms step_avg:223.30ms step:1957/7050 train_time:437002ms step_avg:223.30ms step:1958/7050 train_time:437229ms step_avg:223.30ms step:1959/7050 train_time:437456ms step_avg:223.31ms step:1960/7050 train_time:437684ms step_avg:223.31ms step:1961/7050 train_time:437913ms step_avg:223.31ms step:1962/7050 train_time:438141ms step_avg:223.31ms step:1963/7050 train_time:438369ms step_avg:223.32ms step:1964/7050 train_time:438596ms step_avg:223.32ms step:1965/7050 train_time:438828ms step_avg:223.32ms step:1966/7050 train_time:439058ms step_avg:223.33ms step:1967/7050 train_time:439283ms step_avg:223.33ms step:1968/7050 train_time:439511ms step_avg:223.33ms step:1969/7050 train_time:439740ms step_avg:223.33ms step:1970/7050 train_time:439969ms step_avg:223.33ms step:1971/7050 train_time:440195ms step_avg:223.34ms step:1972/7050 train_time:440423ms step_avg:223.34ms step:1973/7050 train_time:440652ms step_avg:223.34ms step:1974/7050 train_time:440880ms step_avg:223.34ms step:1975/7050 train_time:441108ms step_avg:223.35ms step:1976/7050 train_time:441338ms step_avg:223.35ms step:1977/7050 train_time:441564ms step_avg:223.35ms step:1978/7050 train_time:441792ms step_avg:223.35ms step:1979/7050 train_time:442020ms step_avg:223.36ms step:1980/7050 train_time:442250ms step_avg:223.36ms step:1981/7050 train_time:442477ms step_avg:223.36ms step:1982/7050 train_time:442704ms step_avg:223.36ms step:1983/7050 train_time:442932ms step_avg:223.36ms step:1984/7050 train_time:443163ms step_avg:223.37ms step:1985/7050 train_time:443390ms step_avg:223.37ms step:1986/7050 train_time:443617ms step_avg:223.37ms step:1987/7050 train_time:443847ms step_avg:223.38ms step:1988/7050 train_time:444074ms step_avg:223.38ms step:1989/7050 train_time:444302ms step_avg:223.38ms 
step:1990/7050 train_time:444531ms step_avg:223.38ms step:1991/7050 train_time:444759ms step_avg:223.38ms step:1992/7050 train_time:444988ms step_avg:223.39ms step:1993/7050 train_time:445215ms step_avg:223.39ms step:1994/7050 train_time:445442ms step_avg:223.39ms step:1995/7050 train_time:445672ms step_avg:223.39ms step:1996/7050 train_time:445900ms step_avg:223.40ms step:1997/7050 train_time:446127ms step_avg:223.40ms step:1998/7050 train_time:446356ms step_avg:223.40ms step:1999/7050 train_time:446583ms step_avg:223.40ms step:2000/7050 train_time:446812ms step_avg:223.41ms step:2000/7050 val_loss:3.2565 train_time:446994ms step_avg:223.50ms step:2001/7050 train_time:447043ms step_avg:223.41ms step:2002/7050 train_time:447270ms step_avg:223.41ms step:2003/7050 train_time:447503ms step_avg:223.42ms step:2004/7050 train_time:447732ms step_avg:223.42ms step:2005/7050 train_time:447960ms step_avg:223.42ms step:2006/7050 train_time:448186ms step_avg:223.42ms step:2007/7050 train_time:448414ms step_avg:223.43ms step:2008/7050 train_time:448644ms step_avg:223.43ms step:2009/7050 train_time:448872ms step_avg:223.43ms step:2010/7050 train_time:449100ms step_avg:223.43ms step:2011/7050 train_time:449326ms step_avg:223.43ms step:2012/7050 train_time:449556ms step_avg:223.44ms step:2013/7050 train_time:449784ms step_avg:223.44ms step:2014/7050 train_time:450012ms step_avg:223.44ms step:2015/7050 train_time:450240ms step_avg:223.44ms step:2016/7050 train_time:450467ms step_avg:223.45ms step:2017/7050 train_time:450695ms step_avg:223.45ms step:2018/7050 train_time:450924ms step_avg:223.45ms step:2019/7050 train_time:451152ms step_avg:223.45ms step:2020/7050 train_time:451381ms step_avg:223.46ms step:2021/7050 train_time:451610ms step_avg:223.46ms step:2022/7050 train_time:451838ms step_avg:223.46ms step:2023/7050 train_time:452067ms step_avg:223.46ms step:2024/7050 train_time:452295ms step_avg:223.47ms step:2025/7050 train_time:452522ms step_avg:223.47ms step:2026/7050 
train_time:452750ms step_avg:223.47ms step:2027/7050 train_time:452978ms step_avg:223.47ms step:2028/7050 train_time:453205ms step_avg:223.47ms step:2029/7050 train_time:453433ms step_avg:223.48ms step:2030/7050 train_time:453661ms step_avg:223.48ms step:2031/7050 train_time:453887ms step_avg:223.48ms step:2032/7050 train_time:454114ms step_avg:223.48ms step:2033/7050 train_time:454343ms step_avg:223.48ms step:2034/7050 train_time:454572ms step_avg:223.49ms step:2035/7050 train_time:454801ms step_avg:223.49ms step:2036/7050 train_time:455029ms step_avg:223.49ms step:2037/7050 train_time:455258ms step_avg:223.49ms step:2038/7050 train_time:455486ms step_avg:223.50ms step:2039/7050 train_time:455714ms step_avg:223.50ms step:2040/7050 train_time:455942ms step_avg:223.50ms step:2041/7050 train_time:456169ms step_avg:223.50ms step:2042/7050 train_time:456397ms step_avg:223.51ms step:2043/7050 train_time:456625ms step_avg:223.51ms step:2044/7050 train_time:456854ms step_avg:223.51ms step:2045/7050 train_time:457082ms step_avg:223.51ms step:2046/7050 train_time:457309ms step_avg:223.51ms step:2047/7050 train_time:457538ms step_avg:223.52ms step:2048/7050 train_time:457765ms step_avg:223.52ms step:2049/7050 train_time:457992ms step_avg:223.52ms step:2050/7050 train_time:458221ms step_avg:223.52ms step:2051/7050 train_time:458450ms step_avg:223.52ms step:2052/7050 train_time:458678ms step_avg:223.53ms step:2053/7050 train_time:458906ms step_avg:223.53ms step:2054/7050 train_time:459134ms step_avg:223.53ms step:2055/7050 train_time:459362ms step_avg:223.53ms step:2056/7050 train_time:459591ms step_avg:223.54ms step:2057/7050 train_time:459819ms step_avg:223.54ms step:2058/7050 train_time:460046ms step_avg:223.54ms step:2059/7050 train_time:460274ms step_avg:223.54ms step:2060/7050 train_time:460502ms step_avg:223.54ms step:2061/7050 train_time:460729ms step_avg:223.55ms step:2062/7050 train_time:460958ms step_avg:223.55ms step:2063/7050 train_time:461186ms step_avg:223.55ms 
step:2064/7050 train_time:461414ms step_avg:223.55ms step:2065/7050 train_time:461643ms step_avg:223.56ms step:2066/7050 train_time:461871ms step_avg:223.56ms step:2067/7050 train_time:462099ms step_avg:223.56ms step:2068/7050 train_time:462327ms step_avg:223.56ms step:2069/7050 train_time:462555ms step_avg:223.56ms step:2070/7050 train_time:462782ms step_avg:223.57ms step:2071/7050 train_time:463010ms step_avg:223.57ms step:2072/7050 train_time:463240ms step_avg:223.57ms step:2073/7050 train_time:463467ms step_avg:223.57ms step:2074/7050 train_time:463695ms step_avg:223.58ms step:2075/7050 train_time:463925ms step_avg:223.58ms step:2076/7050 train_time:464151ms step_avg:223.58ms step:2077/7050 train_time:464379ms step_avg:223.58ms step:2078/7050 train_time:464607ms step_avg:223.58ms step:2079/7050 train_time:464837ms step_avg:223.59ms step:2080/7050 train_time:465065ms step_avg:223.59ms step:2081/7050 train_time:465292ms step_avg:223.59ms step:2082/7050 train_time:465521ms step_avg:223.59ms step:2083/7050 train_time:465749ms step_avg:223.60ms step:2084/7050 train_time:465976ms step_avg:223.60ms step:2085/7050 train_time:466204ms step_avg:223.60ms step:2086/7050 train_time:466432ms step_avg:223.60ms step:2087/7050 train_time:466660ms step_avg:223.60ms step:2088/7050 train_time:466888ms step_avg:223.61ms step:2089/7050 train_time:467116ms step_avg:223.61ms step:2090/7050 train_time:467345ms step_avg:223.61ms step:2091/7050 train_time:467573ms step_avg:223.61ms step:2092/7050 train_time:467802ms step_avg:223.61ms step:2093/7050 train_time:468029ms step_avg:223.62ms step:2094/7050 train_time:468260ms step_avg:223.62ms step:2095/7050 train_time:468487ms step_avg:223.62ms step:2096/7050 train_time:468716ms step_avg:223.62ms step:2097/7050 train_time:468944ms step_avg:223.63ms step:2098/7050 train_time:469172ms step_avg:223.63ms step:2099/7050 train_time:469402ms step_avg:223.63ms step:2100/7050 train_time:469630ms step_avg:223.63ms step:2101/7050 train_time:469859ms 
step_avg:223.64ms step:2102/7050 train_time:470086ms step_avg:223.64ms step:2103/7050 train_time:470315ms step_avg:223.64ms step:2104/7050 train_time:470545ms step_avg:223.64ms step:2105/7050 train_time:470773ms step_avg:223.65ms step:2106/7050 train_time:471002ms step_avg:223.65ms step:2107/7050 train_time:471230ms step_avg:223.65ms step:2108/7050 train_time:471460ms step_avg:223.65ms step:2109/7050 train_time:471690ms step_avg:223.66ms step:2110/7050 train_time:471918ms step_avg:223.66ms step:2111/7050 train_time:472148ms step_avg:223.66ms step:2112/7050 train_time:472377ms step_avg:223.66ms step:2113/7050 train_time:472605ms step_avg:223.67ms step:2114/7050 train_time:472834ms step_avg:223.67ms step:2115/7050 train_time:473064ms step_avg:223.67ms step:2116/7050 train_time:473292ms step_avg:223.67ms step:2117/7050 train_time:473520ms step_avg:223.67ms step:2118/7050 train_time:473747ms step_avg:223.68ms step:2119/7050 train_time:473976ms step_avg:223.68ms step:2120/7050 train_time:474204ms step_avg:223.68ms step:2121/7050 train_time:474433ms step_avg:223.68ms step:2122/7050 train_time:474663ms step_avg:223.69ms step:2123/7050 train_time:474892ms step_avg:223.69ms step:2124/7050 train_time:475120ms step_avg:223.69ms step:2125/7050 train_time:475348ms step_avg:223.69ms step:2125/7050 val_loss:3.2351 train_time:475528ms step_avg:223.78ms step:2126/7050 train_time:475578ms step_avg:223.70ms step:2127/7050 train_time:475807ms step_avg:223.70ms step:2128/7050 train_time:476042ms step_avg:223.70ms step:2129/7050 train_time:476272ms step_avg:223.71ms step:2130/7050 train_time:476498ms step_avg:223.71ms step:2131/7050 train_time:476724ms step_avg:223.71ms step:2132/7050 train_time:476957ms step_avg:223.71ms step:2133/7050 train_time:477187ms step_avg:223.72ms step:2134/7050 train_time:477416ms step_avg:223.72ms step:2135/7050 train_time:477644ms step_avg:223.72ms step:2136/7050 train_time:477872ms step_avg:223.72ms step:2137/7050 train_time:478102ms step_avg:223.73ms 
step:2138/7050 train_time:478331ms step_avg:223.73ms step:2139/7050 train_time:478560ms step_avg:223.73ms step:2140/7050 train_time:478787ms step_avg:223.73ms step:2141/7050 train_time:479016ms step_avg:223.73ms step:2142/7050 train_time:479245ms step_avg:223.74ms step:2143/7050 train_time:479474ms step_avg:223.74ms step:2144/7050 train_time:479702ms step_avg:223.74ms step:2145/7050 train_time:479930ms step_avg:223.74ms step:2146/7050 train_time:480162ms step_avg:223.75ms step:2147/7050 train_time:480389ms step_avg:223.75ms step:2148/7050 train_time:480618ms step_avg:223.75ms step:2149/7050 train_time:480846ms step_avg:223.75ms step:2150/7050 train_time:481074ms step_avg:223.76ms step:2151/7050 train_time:481303ms step_avg:223.76ms step:2152/7050 train_time:481532ms step_avg:223.76ms step:2153/7050 train_time:481761ms step_avg:223.76ms step:2154/7050 train_time:481991ms step_avg:223.77ms step:2155/7050 train_time:482221ms step_avg:223.77ms step:2156/7050 train_time:482450ms step_avg:223.77ms step:2157/7050 train_time:482678ms step_avg:223.77ms step:2158/7050 train_time:482905ms step_avg:223.77ms step:2159/7050 train_time:483133ms step_avg:223.78ms step:2160/7050 train_time:483363ms step_avg:223.78ms step:2161/7050 train_time:483591ms step_avg:223.78ms step:2162/7050 train_time:483820ms step_avg:223.78ms step:2163/7050 train_time:484049ms step_avg:223.79ms step:2164/7050 train_time:484277ms step_avg:223.79ms step:2165/7050 train_time:484505ms step_avg:223.79ms step:2166/7050 train_time:484734ms step_avg:223.79ms step:2167/7050 train_time:484963ms step_avg:223.79ms step:2168/7050 train_time:485191ms step_avg:223.80ms step:2169/7050 train_time:485420ms step_avg:223.80ms step:2170/7050 train_time:485649ms step_avg:223.80ms step:2171/7050 train_time:485879ms step_avg:223.80ms step:2172/7050 train_time:486106ms step_avg:223.81ms step:2173/7050 train_time:486334ms step_avg:223.81ms step:2174/7050 train_time:486563ms step_avg:223.81ms step:2175/7050 train_time:486790ms 
step_avg:223.81ms step:2176/7050 train_time:487018ms step_avg:223.81ms step:2177/7050 train_time:487247ms step_avg:223.82ms step:2178/7050 train_time:487476ms step_avg:223.82ms step:2179/7050 train_time:487705ms step_avg:223.82ms step:2180/7050 train_time:487933ms step_avg:223.82ms step:2181/7050 train_time:488163ms step_avg:223.83ms step:2182/7050 train_time:488391ms step_avg:223.83ms step:2183/7050 train_time:488621ms step_avg:223.83ms step:2184/7050 train_time:488853ms step_avg:223.83ms step:2185/7050 train_time:489081ms step_avg:223.84ms step:2186/7050 train_time:489311ms step_avg:223.84ms step:2187/7050 train_time:489540ms step_avg:223.84ms step:2188/7050 train_time:489769ms step_avg:223.84ms step:2189/7050 train_time:489997ms step_avg:223.84ms step:2190/7050 train_time:490225ms step_avg:223.85ms step:2191/7050 train_time:490453ms step_avg:223.85ms step:2192/7050 train_time:490685ms step_avg:223.85ms step:2193/7050 train_time:490911ms step_avg:223.85ms step:2194/7050 train_time:491141ms step_avg:223.86ms step:2195/7050 train_time:491372ms step_avg:223.86ms step:2196/7050 train_time:491601ms step_avg:223.86ms step:2197/7050 train_time:491831ms step_avg:223.86ms step:2198/7050 train_time:492060ms step_avg:223.87ms step:2199/7050 train_time:492289ms step_avg:223.87ms step:2200/7050 train_time:492517ms step_avg:223.87ms step:2201/7050 train_time:492747ms step_avg:223.87ms step:2202/7050 train_time:492975ms step_avg:223.88ms step:2203/7050 train_time:493205ms step_avg:223.88ms step:2204/7050 train_time:493433ms step_avg:223.88ms step:2205/7050 train_time:493662ms step_avg:223.88ms step:2206/7050 train_time:493893ms step_avg:223.89ms step:2207/7050 train_time:494121ms step_avg:223.89ms step:2208/7050 train_time:494350ms step_avg:223.89ms step:2209/7050 train_time:494581ms step_avg:223.89ms step:2210/7050 train_time:494810ms step_avg:223.90ms step:2211/7050 train_time:495040ms step_avg:223.90ms step:2212/7050 train_time:495269ms step_avg:223.90ms step:2213/7050 
train_time:495498ms step_avg:223.90ms step:2214/7050 train_time:495727ms step_avg:223.91ms step:2215/7050 train_time:495956ms step_avg:223.91ms step:2216/7050 train_time:496185ms step_avg:223.91ms step:2217/7050 train_time:496414ms step_avg:223.91ms step:2218/7050 train_time:496644ms step_avg:223.92ms step:2219/7050 train_time:496872ms step_avg:223.92ms step:2220/7050 train_time:497102ms step_avg:223.92ms step:2221/7050 train_time:497331ms step_avg:223.92ms step:2222/7050 train_time:497561ms step_avg:223.92ms step:2223/7050 train_time:497790ms step_avg:223.93ms step:2224/7050 train_time:498019ms step_avg:223.93ms step:2225/7050 train_time:498247ms step_avg:223.93ms step:2226/7050 train_time:498476ms step_avg:223.93ms step:2227/7050 train_time:498704ms step_avg:223.94ms step:2228/7050 train_time:498935ms step_avg:223.94ms step:2229/7050 train_time:499164ms step_avg:223.94ms step:2230/7050 train_time:499391ms step_avg:223.94ms step:2231/7050 train_time:499621ms step_avg:223.94ms step:2232/7050 train_time:499851ms step_avg:223.95ms step:2233/7050 train_time:500079ms step_avg:223.95ms step:2234/7050 train_time:500308ms step_avg:223.95ms step:2235/7050 train_time:500537ms step_avg:223.95ms step:2236/7050 train_time:500765ms step_avg:223.96ms step:2237/7050 train_time:500995ms step_avg:223.96ms step:2238/7050 train_time:501224ms step_avg:223.96ms step:2239/7050 train_time:501456ms step_avg:223.96ms step:2240/7050 train_time:501684ms step_avg:223.97ms step:2241/7050 train_time:501914ms step_avg:223.97ms step:2242/7050 train_time:502144ms step_avg:223.97ms step:2243/7050 train_time:502372ms step_avg:223.97ms step:2244/7050 train_time:502601ms step_avg:223.98ms step:2245/7050 train_time:502831ms step_avg:223.98ms step:2246/7050 train_time:503060ms step_avg:223.98ms step:2247/7050 train_time:503291ms step_avg:223.98ms step:2248/7050 train_time:503519ms step_avg:223.99ms step:2249/7050 train_time:503747ms step_avg:223.99ms step:2250/7050 train_time:503976ms step_avg:223.99ms 
step:2250/7050 val_loss:3.2233 train_time:504156ms step_avg:224.07ms step:2251/7050 train_time:504205ms step_avg:223.99ms step:2252/7050 train_time:504433ms step_avg:223.99ms step:2253/7050 train_time:504667ms step_avg:224.00ms step:2254/7050 train_time:504897ms step_avg:224.00ms step:2255/7050 train_time:505123ms step_avg:224.00ms step:2256/7050 train_time:505351ms step_avg:224.00ms step:2257/7050 train_time:505581ms step_avg:224.01ms step:2258/7050 train_time:505812ms step_avg:224.01ms step:2259/7050 train_time:506041ms step_avg:224.01ms step:2260/7050 train_time:506268ms step_avg:224.01ms step:2261/7050 train_time:506497ms step_avg:224.01ms step:2262/7050 train_time:506726ms step_avg:224.02ms step:2263/7050 train_time:506955ms step_avg:224.02ms step:2264/7050 train_time:507185ms step_avg:224.02ms step:2265/7050 train_time:507411ms step_avg:224.02ms step:2266/7050 train_time:507642ms step_avg:224.03ms step:2267/7050 train_time:507869ms step_avg:224.03ms step:2268/7050 train_time:508098ms step_avg:224.03ms step:2269/7050 train_time:508327ms step_avg:224.03ms step:2270/7050 train_time:508557ms step_avg:224.03ms step:2271/7050 train_time:508786ms step_avg:224.04ms step:2272/7050 train_time:509015ms step_avg:224.04ms step:2273/7050 train_time:509242ms step_avg:224.04ms step:2274/7050 train_time:509473ms step_avg:224.04ms step:2275/7050 train_time:509702ms step_avg:224.04ms step:2276/7050 train_time:509930ms step_avg:224.05ms step:2277/7050 train_time:510159ms step_avg:224.05ms step:2278/7050 train_time:510388ms step_avg:224.05ms step:2279/7050 train_time:510616ms step_avg:224.05ms step:2280/7050 train_time:510844ms step_avg:224.05ms step:2281/7050 train_time:511073ms step_avg:224.06ms step:2282/7050 train_time:511301ms step_avg:224.06ms step:2283/7050 train_time:511528ms step_avg:224.06ms step:2284/7050 train_time:511758ms step_avg:224.06ms step:2285/7050 train_time:511988ms step_avg:224.06ms step:2286/7050 train_time:512217ms step_avg:224.07ms step:2287/7050 
train_time:512445ms step_avg:224.07ms step:2288/7050 train_time:512674ms step_avg:224.07ms step:2289/7050 train_time:512904ms step_avg:224.07ms step:2290/7050 train_time:513132ms step_avg:224.08ms step:2291/7050 train_time:513361ms step_avg:224.08ms step:2292/7050 train_time:513590ms step_avg:224.08ms step:2293/7050 train_time:513818ms step_avg:224.08ms step:2294/7050 train_time:514047ms step_avg:224.08ms step:2295/7050 train_time:514277ms step_avg:224.09ms step:2296/7050 train_time:514505ms step_avg:224.09ms step:2297/7050 train_time:514735ms step_avg:224.09ms step:2298/7050 train_time:514964ms step_avg:224.09ms step:2299/7050 train_time:515193ms step_avg:224.09ms step:2300/7050 train_time:515421ms step_avg:224.10ms step:2301/7050 train_time:515650ms step_avg:224.10ms step:2302/7050 train_time:515879ms step_avg:224.10ms step:2303/7050 train_time:516108ms step_avg:224.10ms step:2304/7050 train_time:516336ms step_avg:224.10ms step:2305/7050 train_time:516564ms step_avg:224.11ms step:2306/7050 train_time:516795ms step_avg:224.11ms step:2307/7050 train_time:517024ms step_avg:224.11ms step:2308/7050 train_time:517253ms step_avg:224.11ms step:2309/7050 train_time:517482ms step_avg:224.12ms step:2310/7050 train_time:517711ms step_avg:224.12ms step:2311/7050 train_time:517940ms step_avg:224.12ms step:2312/7050 train_time:518169ms step_avg:224.12ms step:2313/7050 train_time:518400ms step_avg:224.12ms step:2314/7050 train_time:518628ms step_avg:224.13ms step:2315/7050 train_time:518856ms step_avg:224.13ms step:2316/7050 train_time:519085ms step_avg:224.13ms step:2317/7050 train_time:519314ms step_avg:224.13ms step:2318/7050 train_time:519543ms step_avg:224.13ms step:2319/7050 train_time:519771ms step_avg:224.14ms step:2320/7050 train_time:520001ms step_avg:224.14ms step:2321/7050 train_time:520228ms step_avg:224.14ms step:2322/7050 train_time:520458ms step_avg:224.14ms step:2323/7050 train_time:520687ms step_avg:224.14ms step:2324/7050 train_time:520916ms step_avg:224.15ms 
step:2325/7050 train_time:521144ms step_avg:224.15ms step:2326/7050 train_time:521372ms step_avg:224.15ms step:2327/7050 train_time:521602ms step_avg:224.15ms step:2328/7050 train_time:521829ms step_avg:224.15ms step:2329/7050 train_time:522060ms step_avg:224.16ms step:2330/7050 train_time:522290ms step_avg:224.16ms step:2331/7050 train_time:522518ms step_avg:224.16ms step:2332/7050 train_time:522747ms step_avg:224.16ms step:2333/7050 train_time:522976ms step_avg:224.16ms step:2334/7050 train_time:523205ms step_avg:224.17ms step:2335/7050 train_time:523435ms step_avg:224.17ms step:2336/7050 train_time:523663ms step_avg:224.17ms step:2337/7050 train_time:523891ms step_avg:224.17ms step:2338/7050 train_time:524120ms step_avg:224.17ms step:2339/7050 train_time:524347ms step_avg:224.18ms step:2340/7050 train_time:524576ms step_avg:224.18ms step:2341/7050 train_time:524809ms step_avg:224.18ms step:2342/7050 train_time:525037ms step_avg:224.18ms step:2343/7050 train_time:525264ms step_avg:224.18ms step:2344/7050 train_time:525494ms step_avg:224.19ms step:2345/7050 train_time:525722ms step_avg:224.19ms step:2346/7050 train_time:525951ms step_avg:224.19ms step:2347/7050 train_time:526180ms step_avg:224.19ms step:2348/7050 train_time:526410ms step_avg:224.19ms step:2349/7050 train_time:526639ms step_avg:224.20ms step:2350/7050 train_time:526868ms step_avg:224.20ms step:2351/7050 train_time:527097ms step_avg:224.20ms step:2352/7050 train_time:527325ms step_avg:224.20ms step:2353/7050 train_time:527554ms step_avg:224.20ms step:2354/7050 train_time:527783ms step_avg:224.21ms step:2355/7050 train_time:528012ms step_avg:224.21ms step:2356/7050 train_time:528240ms step_avg:224.21ms step:2357/7050 train_time:528469ms step_avg:224.21ms step:2358/7050 train_time:528697ms step_avg:224.21ms step:2359/7050 train_time:528926ms step_avg:224.22ms step:2360/7050 train_time:529155ms step_avg:224.22ms step:2361/7050 train_time:529384ms step_avg:224.22ms step:2362/7050 train_time:529612ms 
step_avg:224.22ms step:2363/7050 train_time:529843ms step_avg:224.22ms step:2364/7050 train_time:530070ms step_avg:224.23ms step:2365/7050 train_time:530301ms step_avg:224.23ms step:2366/7050 train_time:530529ms step_avg:224.23ms step:2367/7050 train_time:530758ms step_avg:224.23ms step:2368/7050 train_time:530988ms step_avg:224.23ms step:2369/7050 train_time:531217ms step_avg:224.24ms step:2370/7050 train_time:531447ms step_avg:224.24ms step:2371/7050 train_time:531677ms step_avg:224.24ms step:2372/7050 train_time:531905ms step_avg:224.24ms step:2373/7050 train_time:532134ms step_avg:224.25ms step:2374/7050 train_time:532362ms step_avg:224.25ms step:2375/7050 train_time:532591ms step_avg:224.25ms step:2375/7050 val_loss:3.2136 train_time:532772ms step_avg:224.33ms step:2376/7050 train_time:532822ms step_avg:224.25ms step:2377/7050 train_time:533047ms step_avg:224.25ms step:2378/7050 train_time:533282ms step_avg:224.26ms step:2379/7050 train_time:533513ms step_avg:224.26ms step:2380/7050 train_time:533739ms step_avg:224.26ms step:2381/7050 train_time:533966ms step_avg:224.26ms step:2382/7050 train_time:534196ms step_avg:224.26ms step:2383/7050 train_time:534426ms step_avg:224.27ms step:2384/7050 train_time:534654ms step_avg:224.27ms step:2385/7050 train_time:534883ms step_avg:224.27ms step:2386/7050 train_time:535112ms step_avg:224.27ms step:2387/7050 train_time:535340ms step_avg:224.27ms step:2388/7050 train_time:535569ms step_avg:224.28ms step:2389/7050 train_time:535799ms step_avg:224.28ms step:2390/7050 train_time:536027ms step_avg:224.28ms step:2391/7050 train_time:536255ms step_avg:224.28ms step:2392/7050 train_time:536485ms step_avg:224.28ms step:2393/7050 train_time:536715ms step_avg:224.29ms step:2394/7050 train_time:536943ms step_avg:224.29ms step:2395/7050 train_time:537171ms step_avg:224.29ms step:2396/7050 train_time:537401ms step_avg:224.29ms step:2397/7050 train_time:537631ms step_avg:224.29ms step:2398/7050 train_time:537860ms step_avg:224.30ms 
step:2399/7050 train_time:538088ms step_avg:224.30ms step:2400/7050 train_time:538321ms step_avg:224.30ms step:2401/7050 train_time:538550ms step_avg:224.30ms step:2402/7050 train_time:538778ms step_avg:224.30ms step:2403/7050 train_time:539498ms step_avg:224.51ms step:2404/7050 train_time:539688ms step_avg:224.50ms step:2405/7050 train_time:539914ms step_avg:224.50ms step:2406/7050 train_time:540140ms step_avg:224.50ms step:2407/7050 train_time:540367ms step_avg:224.50ms step:2408/7050 train_time:540597ms step_avg:224.50ms step:2409/7050 train_time:540830ms step_avg:224.50ms step:2410/7050 train_time:541058ms step_avg:224.51ms step:2411/7050 train_time:541284ms step_avg:224.51ms step:2412/7050 train_time:541512ms step_avg:224.51ms step:2413/7050 train_time:541741ms step_avg:224.51ms step:2414/7050 train_time:541973ms step_avg:224.51ms step:2415/7050 train_time:542200ms step_avg:224.51ms step:2416/7050 train_time:542428ms step_avg:224.51ms step:2417/7050 train_time:542656ms step_avg:224.52ms step:2418/7050 train_time:542886ms step_avg:224.52ms step:2419/7050 train_time:543116ms step_avg:224.52ms step:2420/7050 train_time:543344ms step_avg:224.52ms step:2421/7050 train_time:543573ms step_avg:224.52ms step:2422/7050 train_time:543803ms step_avg:224.53ms step:2423/7050 train_time:544032ms step_avg:224.53ms step:2424/7050 train_time:544262ms step_avg:224.53ms step:2425/7050 train_time:544490ms step_avg:224.53ms step:2426/7050 train_time:544719ms step_avg:224.53ms step:2427/7050 train_time:544949ms step_avg:224.54ms step:2428/7050 train_time:545177ms step_avg:224.54ms step:2429/7050 train_time:545406ms step_avg:224.54ms step:2430/7050 train_time:545633ms step_avg:224.54ms step:2431/7050 train_time:545861ms step_avg:224.54ms step:2432/7050 train_time:546090ms step_avg:224.54ms step:2433/7050 train_time:546320ms step_avg:224.55ms step:2434/7050 train_time:546547ms step_avg:224.55ms step:2435/7050 train_time:546776ms step_avg:224.55ms step:2436/7050 train_time:547004ms 
step_avg:224.55ms step:2437/7050 train_time:547233ms step_avg:224.55ms step:2438/7050 train_time:547463ms step_avg:224.55ms step:2439/7050 train_time:547691ms step_avg:224.56ms step:2440/7050 train_time:547920ms step_avg:224.56ms step:2441/7050 train_time:548149ms step_avg:224.56ms step:2442/7050 train_time:548377ms step_avg:224.56ms step:2443/7050 train_time:548605ms step_avg:224.56ms step:2444/7050 train_time:548834ms step_avg:224.56ms step:2445/7050 train_time:549062ms step_avg:224.57ms step:2446/7050 train_time:549290ms step_avg:224.57ms step:2447/7050 train_time:549518ms step_avg:224.57ms step:2448/7050 train_time:549746ms step_avg:224.57ms step:2449/7050 train_time:549975ms step_avg:224.57ms step:2450/7050 train_time:550203ms step_avg:224.57ms step:2451/7050 train_time:550432ms step_avg:224.57ms step:2452/7050 train_time:550660ms step_avg:224.58ms step:2453/7050 train_time:550889ms step_avg:224.58ms step:2454/7050 train_time:551118ms step_avg:224.58ms step:2455/7050 train_time:551346ms step_avg:224.58ms step:2456/7050 train_time:551574ms step_avg:224.58ms step:2457/7050 train_time:551803ms step_avg:224.58ms step:2458/7050 train_time:552031ms step_avg:224.59ms step:2459/7050 train_time:552260ms step_avg:224.59ms step:2460/7050 train_time:552490ms step_avg:224.59ms step:2461/7050 train_time:552717ms step_avg:224.59ms step:2462/7050 train_time:552945ms step_avg:224.59ms step:2463/7050 train_time:553175ms step_avg:224.59ms step:2464/7050 train_time:553404ms step_avg:224.60ms step:2465/7050 train_time:553633ms step_avg:224.60ms step:2466/7050 train_time:553863ms step_avg:224.60ms step:2467/7050 train_time:554092ms step_avg:224.60ms step:2468/7050 train_time:554321ms step_avg:224.60ms step:2469/7050 train_time:554549ms step_avg:224.60ms step:2470/7050 train_time:554778ms step_avg:224.61ms step:2471/7050 train_time:555007ms step_avg:224.61ms step:2472/7050 train_time:555235ms step_avg:224.61ms step:2473/7050 train_time:555463ms step_avg:224.61ms step:2474/7050 
train_time:555692ms step_avg:224.61ms step:2475/7050 train_time:555923ms step_avg:224.62ms step:2476/7050 train_time:556150ms step_avg:224.62ms step:2477/7050 train_time:556378ms step_avg:224.62ms step:2478/7050 train_time:556606ms step_avg:224.62ms step:2479/7050 train_time:556834ms step_avg:224.62ms step:2480/7050 train_time:557064ms step_avg:224.62ms step:2481/7050 train_time:557292ms step_avg:224.62ms step:2482/7050 train_time:557522ms step_avg:224.63ms step:2483/7050 train_time:557750ms step_avg:224.63ms step:2484/7050 train_time:557979ms step_avg:224.63ms step:2485/7050 train_time:558208ms step_avg:224.63ms step:2486/7050 train_time:558438ms step_avg:224.63ms step:2487/7050 train_time:558664ms step_avg:224.63ms step:2488/7050 train_time:558892ms step_avg:224.64ms step:2489/7050 train_time:559122ms step_avg:224.64ms step:2490/7050 train_time:559351ms step_avg:224.64ms step:2491/7050 train_time:559579ms step_avg:224.64ms step:2492/7050 train_time:559808ms step_avg:224.64ms step:2493/7050 train_time:560037ms step_avg:224.64ms step:2494/7050 train_time:560266ms step_avg:224.65ms step:2495/7050 train_time:560496ms step_avg:224.65ms step:2496/7050 train_time:560723ms step_avg:224.65ms step:2497/7050 train_time:560952ms step_avg:224.65ms step:2498/7050 train_time:561180ms step_avg:224.65ms step:2499/7050 train_time:561410ms step_avg:224.65ms step:2500/7050 train_time:561638ms step_avg:224.66ms step:2500/7050 val_loss:3.2047 train_time:561818ms step_avg:224.73ms step:2501/7050 train_time:561867ms step_avg:224.66ms step:2502/7050 train_time:562096ms step_avg:224.66ms step:2503/7050 train_time:562328ms step_avg:224.66ms step:2504/7050 train_time:562557ms step_avg:224.66ms step:2505/7050 train_time:562785ms step_avg:224.66ms step:2506/7050 train_time:563014ms step_avg:224.67ms step:2507/7050 train_time:563242ms step_avg:224.67ms step:2508/7050 train_time:563472ms step_avg:224.67ms step:2509/7050 train_time:563700ms step_avg:224.67ms step:2510/7050 train_time:563927ms 
step_avg:224.67ms step:2511/7050 train_time:564156ms step_avg:224.67ms step:2512/7050 train_time:564387ms step_avg:224.68ms step:2513/7050 train_time:564617ms step_avg:224.68ms step:2514/7050 train_time:564843ms step_avg:224.68ms step:2515/7050 train_time:565073ms step_avg:224.68ms step:2516/7050 train_time:565303ms step_avg:224.68ms step:2517/7050 train_time:565532ms step_avg:224.68ms step:2518/7050 train_time:565760ms step_avg:224.69ms step:2519/7050 train_time:565988ms step_avg:224.69ms step:2520/7050 train_time:566216ms step_avg:224.69ms step:2521/7050 train_time:566445ms step_avg:224.69ms step:2522/7050 train_time:566674ms step_avg:224.69ms step:2523/7050 train_time:566904ms step_avg:224.69ms step:2524/7050 train_time:567132ms step_avg:224.70ms step:2525/7050 train_time:567361ms step_avg:224.70ms step:2526/7050 train_time:567589ms step_avg:224.70ms step:2527/7050 train_time:567818ms step_avg:224.70ms step:2528/7050 train_time:568045ms step_avg:224.70ms step:2529/7050 train_time:568275ms step_avg:224.70ms step:2530/7050 train_time:568507ms step_avg:224.71ms step:2531/7050 train_time:568735ms step_avg:224.71ms step:2532/7050 train_time:568964ms step_avg:224.71ms step:2533/7050 train_time:569193ms step_avg:224.71ms step:2534/7050 train_time:569422ms step_avg:224.71ms step:2535/7050 train_time:569652ms step_avg:224.71ms step:2536/7050 train_time:569880ms step_avg:224.72ms step:2537/7050 train_time:570109ms step_avg:224.72ms step:2538/7050 train_time:570336ms step_avg:224.72ms step:2539/7050 train_time:570565ms step_avg:224.72ms step:2540/7050 train_time:570794ms step_avg:224.72ms step:2541/7050 train_time:571025ms step_avg:224.72ms step:2542/7050 train_time:571254ms step_avg:224.73ms step:2543/7050 train_time:571483ms step_avg:224.73ms step:2544/7050 train_time:571712ms step_avg:224.73ms step:2545/7050 train_time:571941ms step_avg:224.73ms step:2546/7050 train_time:572171ms step_avg:224.73ms step:2547/7050 train_time:572399ms step_avg:224.73ms step:2548/7050 
train_time:572627ms step_avg:224.74ms step:2549/7050 train_time:572858ms step_avg:224.74ms step:2550/7050 train_time:573086ms step_avg:224.74ms step:2551/7050 train_time:573315ms step_avg:224.74ms step:2552/7050 train_time:573543ms step_avg:224.74ms step:2553/7050 train_time:573772ms step_avg:224.74ms step:2554/7050 train_time:574001ms step_avg:224.75ms step:2555/7050 train_time:574229ms step_avg:224.75ms step:2556/7050 train_time:574458ms step_avg:224.75ms step:2557/7050 train_time:574689ms step_avg:224.75ms step:2558/7050 train_time:574917ms step_avg:224.75ms step:2559/7050 train_time:575145ms step_avg:224.75ms step:2560/7050 train_time:575376ms step_avg:224.76ms step:2561/7050 train_time:575606ms step_avg:224.76ms step:2562/7050 train_time:575833ms step_avg:224.76ms step:2563/7050 train_time:576063ms step_avg:224.76ms step:2564/7050 train_time:576292ms step_avg:224.76ms step:2565/7050 train_time:576522ms step_avg:224.76ms step:2566/7050 train_time:576751ms step_avg:224.77ms step:2567/7050 train_time:576980ms step_avg:224.77ms step:2568/7050 train_time:577208ms step_avg:224.77ms step:2569/7050 train_time:577436ms step_avg:224.77ms step:2570/7050 train_time:577665ms step_avg:224.77ms step:2571/7050 train_time:577898ms step_avg:224.78ms step:2572/7050 train_time:578126ms step_avg:224.78ms step:2573/7050 train_time:578354ms step_avg:224.78ms step:2574/7050 train_time:578584ms step_avg:224.78ms step:2575/7050 train_time:578813ms step_avg:224.78ms step:2576/7050 train_time:579042ms step_avg:224.78ms step:2577/7050 train_time:579272ms step_avg:224.79ms step:2578/7050 train_time:579501ms step_avg:224.79ms step:2579/7050 train_time:579730ms step_avg:224.79ms step:2580/7050 train_time:579958ms step_avg:224.79ms step:2581/7050 train_time:580187ms step_avg:224.79ms step:2582/7050 train_time:580418ms step_avg:224.79ms step:2583/7050 train_time:580648ms step_avg:224.80ms step:2584/7050 train_time:580876ms step_avg:224.80ms step:2585/7050 train_time:581107ms step_avg:224.80ms 
step:2586/7050 train_time:581336ms step_avg:224.80ms step:2587/7050 train_time:581565ms step_avg:224.80ms step:2588/7050 train_time:581794ms step_avg:224.80ms step:2589/7050 train_time:582022ms step_avg:224.81ms step:2590/7050 train_time:582251ms step_avg:224.81ms step:2591/7050 train_time:582480ms step_avg:224.81ms step:2592/7050 train_time:582710ms step_avg:224.81ms step:2593/7050 train_time:582939ms step_avg:224.81ms step:2594/7050 train_time:583167ms step_avg:224.81ms step:2595/7050 train_time:583396ms step_avg:224.82ms step:2596/7050 train_time:583628ms step_avg:224.82ms step:2597/7050 train_time:583855ms step_avg:224.82ms step:2598/7050 train_time:584084ms step_avg:224.82ms step:2599/7050 train_time:584312ms step_avg:224.82ms step:2600/7050 train_time:584540ms step_avg:224.82ms step:2601/7050 train_time:584768ms step_avg:224.82ms step:2602/7050 train_time:584997ms step_avg:224.83ms step:2603/7050 train_time:585226ms step_avg:224.83ms step:2604/7050 train_time:585454ms step_avg:224.83ms step:2605/7050 train_time:585682ms step_avg:224.83ms step:2606/7050 train_time:585912ms step_avg:224.83ms step:2607/7050 train_time:586140ms step_avg:224.83ms step:2608/7050 train_time:586369ms step_avg:224.83ms step:2609/7050 train_time:586597ms step_avg:224.84ms step:2610/7050 train_time:586825ms step_avg:224.84ms step:2611/7050 train_time:587055ms step_avg:224.84ms step:2612/7050 train_time:587284ms step_avg:224.84ms step:2613/7050 train_time:587514ms step_avg:224.84ms step:2614/7050 train_time:587747ms step_avg:224.85ms step:2615/7050 train_time:587981ms step_avg:224.85ms step:2616/7050 train_time:588214ms step_avg:224.85ms step:2617/7050 train_time:588446ms step_avg:224.86ms step:2618/7050 train_time:588679ms step_avg:224.86ms step:2619/7050 train_time:588912ms step_avg:224.86ms step:2620/7050 train_time:589622ms step_avg:225.05ms step:2621/7050 train_time:589852ms step_avg:225.05ms step:2622/7050 train_time:590082ms step_avg:225.05ms step:2623/7050 train_time:590313ms 
step_avg:225.05ms step:2624/7050 train_time:590551ms step_avg:225.06ms step:2625/7050 train_time:590786ms step_avg:225.06ms step:2625/7050 val_loss:3.1907 train_time:590968ms step_avg:225.13ms step:2626/7050 train_time:591021ms step_avg:225.07ms step:2627/7050 train_time:591250ms step_avg:225.07ms step:2628/7050 train_time:591489ms step_avg:225.07ms step:2629/7050 train_time:591722ms step_avg:225.07ms step:2630/7050 train_time:591952ms step_avg:225.08ms step:2631/7050 train_time:592183ms step_avg:225.08ms step:2632/7050 train_time:592418ms step_avg:225.08ms step:2633/7050 train_time:592650ms step_avg:225.09ms step:2634/7050 train_time:592883ms step_avg:225.09ms step:2635/7050 train_time:593116ms step_avg:225.09ms step:2636/7050 train_time:593348ms step_avg:225.09ms step:2637/7050 train_time:593584ms step_avg:225.10ms step:2638/7050 train_time:593817ms step_avg:225.10ms step:2639/7050 train_time:594049ms step_avg:225.10ms step:2640/7050 train_time:594281ms step_avg:225.11ms step:2641/7050 train_time:594516ms step_avg:225.11ms step:2642/7050 train_time:594747ms step_avg:225.11ms step:2643/7050 train_time:594979ms step_avg:225.11ms step:2644/7050 train_time:595213ms step_avg:225.12ms step:2645/7050 train_time:595445ms step_avg:225.12ms step:2646/7050 train_time:595679ms step_avg:225.12ms step:2647/7050 train_time:595911ms step_avg:225.13ms step:2648/7050 train_time:596143ms step_avg:225.13ms step:2649/7050 train_time:596378ms step_avg:225.13ms step:2650/7050 train_time:596611ms step_avg:225.14ms step:2651/7050 train_time:596843ms step_avg:225.14ms step:2652/7050 train_time:597075ms step_avg:225.14ms step:2653/7050 train_time:597309ms step_avg:225.14ms step:2654/7050 train_time:597540ms step_avg:225.15ms step:2655/7050 train_time:597775ms step_avg:225.15ms step:2656/7050 train_time:598010ms step_avg:225.15ms step:2657/7050 train_time:598241ms step_avg:225.16ms step:2658/7050 train_time:598474ms step_avg:225.16ms step:2659/7050 train_time:598707ms step_avg:225.16ms 
step:2660/7050 train_time:598940ms step_avg:225.17ms step:2661/7050 train_time:599172ms step_avg:225.17ms step:2662/7050 train_time:599408ms step_avg:225.17ms step:2663/7050 train_time:599640ms step_avg:225.17ms step:2664/7050 train_time:599872ms step_avg:225.18ms step:2665/7050 train_time:600106ms step_avg:225.18ms step:2666/7050 train_time:600337ms step_avg:225.18ms step:2667/7050 train_time:600570ms step_avg:225.19ms step:2668/7050 train_time:600803ms step_avg:225.19ms step:2669/7050 train_time:601037ms step_avg:225.19ms step:2670/7050 train_time:601269ms step_avg:225.19ms step:2671/7050 train_time:601503ms step_avg:225.20ms step:2672/7050 train_time:601735ms step_avg:225.20ms step:2673/7050 train_time:601968ms step_avg:225.20ms step:2674/7050 train_time:602202ms step_avg:225.21ms step:2675/7050 train_time:602435ms step_avg:225.21ms step:2676/7050 train_time:602667ms step_avg:225.21ms step:2677/7050 train_time:602898ms step_avg:225.21ms step:2678/7050 train_time:603131ms step_avg:225.22ms step:2679/7050 train_time:603363ms step_avg:225.22ms step:2680/7050 train_time:603596ms step_avg:225.22ms step:2681/7050 train_time:603828ms step_avg:225.22ms step:2682/7050 train_time:604061ms step_avg:225.23ms step:2683/7050 train_time:604294ms step_avg:225.23ms step:2684/7050 train_time:604527ms step_avg:225.23ms step:2685/7050 train_time:604759ms step_avg:225.24ms step:2686/7050 train_time:604993ms step_avg:225.24ms step:2687/7050 train_time:605225ms step_avg:225.24ms step:2688/7050 train_time:605457ms step_avg:225.24ms step:2689/7050 train_time:605690ms step_avg:225.25ms step:2690/7050 train_time:605923ms step_avg:225.25ms step:2691/7050 train_time:606155ms step_avg:225.25ms step:2692/7050 train_time:606387ms step_avg:225.26ms step:2693/7050 train_time:606620ms step_avg:225.26ms step:2694/7050 train_time:606851ms step_avg:225.26ms step:2695/7050 train_time:607082ms step_avg:225.26ms step:2696/7050 train_time:607316ms step_avg:225.27ms step:2697/7050 train_time:607549ms 
step_avg:225.27ms step:2698/7050 train_time:607781ms step_avg:225.27ms step:2699/7050 train_time:608013ms step_avg:225.27ms step:2700/7050 train_time:608246ms step_avg:225.28ms step:2701/7050 train_time:608478ms step_avg:225.28ms step:2702/7050 train_time:608713ms step_avg:225.28ms step:2703/7050 train_time:608945ms step_avg:225.28ms step:2704/7050 train_time:609176ms step_avg:225.29ms step:2705/7050 train_time:609409ms step_avg:225.29ms step:2706/7050 train_time:609642ms step_avg:225.29ms step:2707/7050 train_time:609876ms step_avg:225.30ms step:2708/7050 train_time:610109ms step_avg:225.30ms step:2709/7050 train_time:610341ms step_avg:225.30ms step:2710/7050 train_time:610573ms step_avg:225.30ms step:2711/7050 train_time:610805ms step_avg:225.31ms step:2712/7050 train_time:611038ms step_avg:225.31ms step:2713/7050 train_time:611272ms step_avg:225.31ms step:2714/7050 train_time:611503ms step_avg:225.31ms step:2715/7050 train_time:611737ms step_avg:225.32ms step:2716/7050 train_time:611970ms step_avg:225.32ms step:2717/7050 train_time:612204ms step_avg:225.32ms step:2718/7050 train_time:612437ms step_avg:225.33ms step:2719/7050 train_time:612669ms step_avg:225.33ms step:2720/7050 train_time:612902ms step_avg:225.33ms step:2721/7050 train_time:613136ms step_avg:225.33ms step:2722/7050 train_time:613368ms step_avg:225.34ms step:2723/7050 train_time:613600ms step_avg:225.34ms step:2724/7050 train_time:613833ms step_avg:225.34ms step:2725/7050 train_time:614065ms step_avg:225.35ms step:2726/7050 train_time:614298ms step_avg:225.35ms step:2727/7050 train_time:614531ms step_avg:225.35ms step:2728/7050 train_time:614764ms step_avg:225.35ms step:2729/7050 train_time:614996ms step_avg:225.36ms step:2730/7050 train_time:615229ms step_avg:225.36ms step:2731/7050 train_time:615461ms step_avg:225.36ms step:2732/7050 train_time:615695ms step_avg:225.36ms step:2733/7050 train_time:615927ms step_avg:225.37ms step:2734/7050 train_time:616160ms step_avg:225.37ms step:2735/7050 
train_time:616393ms step_avg:225.37ms step:2736/7050 train_time:616626ms step_avg:225.38ms step:2737/7050 train_time:616858ms step_avg:225.38ms step:2738/7050 train_time:617091ms step_avg:225.38ms step:2739/7050 train_time:617325ms step_avg:225.38ms step:2740/7050 train_time:617557ms step_avg:225.39ms step:2741/7050 train_time:617792ms step_avg:225.39ms step:2742/7050 train_time:618024ms step_avg:225.39ms step:2743/7050 train_time:618255ms step_avg:225.39ms step:2744/7050 train_time:618487ms step_avg:225.40ms step:2745/7050 train_time:618722ms step_avg:225.40ms step:2746/7050 train_time:618954ms step_avg:225.40ms step:2747/7050 train_time:619186ms step_avg:225.40ms step:2748/7050 train_time:619418ms step_avg:225.41ms step:2749/7050 train_time:619650ms step_avg:225.41ms step:2750/7050 train_time:619882ms step_avg:225.41ms step:2750/7050 val_loss:3.1829 train_time:620068ms step_avg:225.48ms step:2751/7050 train_time:620120ms step_avg:225.42ms step:2752/7050 train_time:620350ms step_avg:225.42ms step:2753/7050 train_time:620589ms step_avg:225.42ms step:2754/7050 train_time:620822ms step_avg:225.43ms step:2755/7050 train_time:621053ms step_avg:225.43ms step:2756/7050 train_time:621285ms step_avg:225.43ms step:2757/7050 train_time:621519ms step_avg:225.43ms step:2758/7050 train_time:621752ms step_avg:225.44ms step:2759/7050 train_time:621987ms step_avg:225.44ms step:2760/7050 train_time:622218ms step_avg:225.44ms step:2761/7050 train_time:622450ms step_avg:225.44ms step:2762/7050 train_time:622682ms step_avg:225.45ms step:2763/7050 train_time:622914ms step_avg:225.45ms step:2764/7050 train_time:623146ms step_avg:225.45ms step:2765/7050 train_time:623377ms step_avg:225.45ms step:2766/7050 train_time:623610ms step_avg:225.46ms step:2767/7050 train_time:623844ms step_avg:225.46ms step:2768/7050 train_time:624076ms step_avg:225.46ms step:2769/7050 train_time:624310ms step_avg:225.46ms step:2770/7050 train_time:624542ms step_avg:225.47ms step:2771/7050 train_time:624775ms 
step_avg:225.47ms step:2772/7050 train_time:625008ms step_avg:225.47ms step:2773/7050 train_time:625240ms step_avg:225.47ms step:2774/7050 train_time:625472ms step_avg:225.48ms step:2775/7050 train_time:625705ms step_avg:225.48ms step:2776/7050 train_time:625938ms step_avg:225.48ms step:2777/7050 train_time:626173ms step_avg:225.49ms step:2778/7050 train_time:626406ms step_avg:225.49ms step:2779/7050 train_time:626637ms step_avg:225.49ms step:2780/7050 train_time:626870ms step_avg:225.49ms step:2781/7050 train_time:627102ms step_avg:225.50ms step:2782/7050 train_time:627335ms step_avg:225.50ms step:2783/7050 train_time:627568ms step_avg:225.50ms step:2784/7050 train_time:627801ms step_avg:225.50ms step:2785/7050 train_time:628033ms step_avg:225.51ms step:2786/7050 train_time:628266ms step_avg:225.51ms step:2787/7050 train_time:628500ms step_avg:225.51ms step:2788/7050 train_time:628731ms step_avg:225.51ms step:2789/7050 train_time:628965ms step_avg:225.52ms step:2790/7050 train_time:629197ms step_avg:225.52ms step:2791/7050 train_time:629432ms step_avg:225.52ms step:2792/7050 train_time:629664ms step_avg:225.52ms step:2793/7050 train_time:629896ms step_avg:225.53ms step:2794/7050 train_time:630130ms step_avg:225.53ms step:2795/7050 train_time:630363ms step_avg:225.53ms step:2796/7050 train_time:630596ms step_avg:225.54ms step:2797/7050 train_time:630828ms step_avg:225.54ms step:2798/7050 train_time:631062ms step_avg:225.54ms step:2799/7050 train_time:631296ms step_avg:225.54ms step:2800/7050 train_time:631530ms step_avg:225.55ms step:2801/7050 train_time:631760ms step_avg:225.55ms step:2802/7050 train_time:631993ms step_avg:225.55ms step:2803/7050 train_time:632227ms step_avg:225.55ms step:2804/7050 train_time:632459ms step_avg:225.56ms step:2805/7050 train_time:632690ms step_avg:225.56ms step:2806/7050 train_time:632924ms step_avg:225.56ms step:2807/7050 train_time:633158ms step_avg:225.56ms step:2808/7050 train_time:633393ms step_avg:225.57ms step:2809/7050 
train_time:633627ms step_avg:225.57ms step:2810/7050 train_time:633858ms step_avg:225.57ms step:2811/7050 train_time:634091ms step_avg:225.57ms step:2812/7050 train_time:634324ms step_avg:225.58ms step:2813/7050 train_time:634557ms step_avg:225.58ms step:2814/7050 train_time:634790ms step_avg:225.58ms step:2815/7050 train_time:635024ms step_avg:225.59ms step:2816/7050 train_time:635256ms step_avg:225.59ms step:2817/7050 train_time:635488ms step_avg:225.59ms step:2818/7050 train_time:635722ms step_avg:225.59ms step:2819/7050 train_time:635953ms step_avg:225.60ms step:2820/7050 train_time:636186ms step_avg:225.60ms step:2821/7050 train_time:636419ms step_avg:225.60ms step:2822/7050 train_time:636651ms step_avg:225.60ms step:2823/7050 train_time:636884ms step_avg:225.61ms step:2824/7050 train_time:637118ms step_avg:225.61ms step:2825/7050 train_time:637352ms step_avg:225.61ms step:2826/7050 train_time:637584ms step_avg:225.61ms step:2827/7050 train_time:637817ms step_avg:225.62ms step:2828/7050 train_time:638050ms step_avg:225.62ms step:2829/7050 train_time:638284ms step_avg:225.62ms step:2830/7050 train_time:638517ms step_avg:225.62ms step:2831/7050 train_time:638752ms step_avg:225.63ms step:2832/7050 train_time:638984ms step_avg:225.63ms step:2833/7050 train_time:639216ms step_avg:225.63ms step:2834/7050 train_time:639449ms step_avg:225.63ms step:2835/7050 train_time:639682ms step_avg:225.64ms step:2836/7050 train_time:639913ms step_avg:225.64ms step:2837/7050 train_time:640146ms step_avg:225.64ms step:2838/7050 train_time:640377ms step_avg:225.64ms step:2839/7050 train_time:640611ms step_avg:225.65ms step:2840/7050 train_time:640845ms step_avg:225.65ms step:2841/7050 train_time:641077ms step_avg:225.65ms step:2842/7050 train_time:641309ms step_avg:225.65ms step:2843/7050 train_time:641542ms step_avg:225.66ms step:2844/7050 train_time:641774ms step_avg:225.66ms step:2845/7050 train_time:642007ms step_avg:225.66ms step:2846/7050 train_time:642238ms step_avg:225.66ms 
step:2847/7050 train_time:642472ms step_avg:225.67ms step:2848/7050 train_time:642705ms step_avg:225.67ms step:2849/7050 train_time:642938ms step_avg:225.67ms step:2850/7050 train_time:643170ms step_avg:225.67ms step:2851/7050 train_time:643402ms step_avg:225.68ms step:2852/7050 train_time:643634ms step_avg:225.68ms step:2853/7050 train_time:643868ms step_avg:225.68ms step:2854/7050 train_time:644100ms step_avg:225.68ms step:2855/7050 train_time:644331ms step_avg:225.69ms step:2856/7050 train_time:644564ms step_avg:225.69ms step:2857/7050 train_time:644799ms step_avg:225.69ms step:2858/7050 train_time:645031ms step_avg:225.69ms step:2859/7050 train_time:645263ms step_avg:225.70ms step:2860/7050 train_time:645495ms step_avg:225.70ms step:2861/7050 train_time:645729ms step_avg:225.70ms step:2862/7050 train_time:645963ms step_avg:225.70ms step:2863/7050 train_time:646196ms step_avg:225.71ms step:2864/7050 train_time:646427ms step_avg:225.71ms step:2865/7050 train_time:646660ms step_avg:225.71ms step:2866/7050 train_time:646894ms step_avg:225.71ms step:2867/7050 train_time:647127ms step_avg:225.72ms step:2868/7050 train_time:647359ms step_avg:225.72ms step:2869/7050 train_time:647591ms step_avg:225.72ms step:2870/7050 train_time:647824ms step_avg:225.72ms step:2871/7050 train_time:648057ms step_avg:225.73ms step:2872/7050 train_time:648289ms step_avg:225.73ms step:2873/7050 train_time:648521ms step_avg:225.73ms step:2874/7050 train_time:648754ms step_avg:225.73ms step:2875/7050 train_time:648987ms step_avg:225.73ms step:2875/7050 val_loss:3.1733 train_time:649172ms step_avg:225.80ms step:2876/7050 train_time:649222ms step_avg:225.74ms step:2877/7050 train_time:649454ms step_avg:225.74ms step:2878/7050 train_time:649689ms step_avg:225.74ms step:2879/7050 train_time:649921ms step_avg:225.75ms step:2880/7050 train_time:650152ms step_avg:225.75ms step:2881/7050 train_time:650384ms step_avg:225.75ms step:2882/7050 train_time:650618ms step_avg:225.75ms step:2883/7050 
train_time:650850ms step_avg:225.75ms step:2884/7050 train_time:651082ms step_avg:225.76ms step:2885/7050 train_time:651313ms step_avg:225.76ms step:2886/7050 train_time:651546ms step_avg:225.76ms step:2887/7050 train_time:651780ms step_avg:225.76ms step:2888/7050 train_time:652012ms step_avg:225.77ms step:2889/7050 train_time:652244ms step_avg:225.77ms step:2890/7050 train_time:652477ms step_avg:225.77ms step:2891/7050 train_time:652710ms step_avg:225.77ms step:2892/7050 train_time:652943ms step_avg:225.78ms step:2893/7050 train_time:653174ms step_avg:225.78ms step:2894/7050 train_time:653407ms step_avg:225.78ms step:2895/7050 train_time:653639ms step_avg:225.78ms step:2896/7050 train_time:653872ms step_avg:225.78ms step:2897/7050 train_time:654104ms step_avg:225.79ms step:2898/7050 train_time:654337ms step_avg:225.79ms step:2899/7050 train_time:654570ms step_avg:225.79ms step:2900/7050 train_time:654803ms step_avg:225.79ms step:2901/7050 train_time:655036ms step_avg:225.80ms step:2902/7050 train_time:655268ms step_avg:225.80ms step:2903/7050 train_time:655501ms step_avg:225.80ms step:2904/7050 train_time:655734ms step_avg:225.80ms step:2905/7050 train_time:655967ms step_avg:225.81ms step:2906/7050 train_time:656199ms step_avg:225.81ms step:2907/7050 train_time:656431ms step_avg:225.81ms step:2908/7050 train_time:656664ms step_avg:225.81ms step:2909/7050 train_time:656898ms step_avg:225.82ms step:2910/7050 train_time:657130ms step_avg:225.82ms step:2911/7050 train_time:657361ms step_avg:225.82ms step:2912/7050 train_time:657594ms step_avg:225.82ms step:2913/7050 train_time:657826ms step_avg:225.82ms step:2914/7050 train_time:658060ms step_avg:225.83ms step:2915/7050 train_time:658293ms step_avg:225.83ms step:2916/7050 train_time:658524ms step_avg:225.83ms step:2917/7050 train_time:658757ms step_avg:225.83ms step:2918/7050 train_time:658989ms step_avg:225.84ms step:2919/7050 train_time:659222ms step_avg:225.84ms step:2920/7050 train_time:659456ms step_avg:225.84ms 
step:2921/7050 train_time:659690ms step_avg:225.84ms step:2922/7050 train_time:659921ms step_avg:225.85ms step:2923/7050 train_time:660153ms step_avg:225.85ms step:2924/7050 train_time:660387ms step_avg:225.85ms step:2925/7050 train_time:660620ms step_avg:225.85ms step:2926/7050 train_time:660852ms step_avg:225.86ms step:2927/7050 train_time:661084ms step_avg:225.86ms step:2928/7050 train_time:661319ms step_avg:225.86ms step:2929/7050 train_time:661554ms step_avg:225.86ms step:2930/7050 train_time:661785ms step_avg:225.87ms step:2931/7050 train_time:662018ms step_avg:225.87ms step:2932/7050 train_time:662249ms step_avg:225.87ms step:2933/7050 train_time:662482ms step_avg:225.87ms step:2934/7050 train_time:662716ms step_avg:225.87ms step:2935/7050 train_time:662948ms step_avg:225.88ms step:2936/7050 train_time:663180ms step_avg:225.88ms step:2937/7050 train_time:663412ms step_avg:225.88ms step:2938/7050 train_time:663647ms step_avg:225.88ms step:2939/7050 train_time:663879ms step_avg:225.89ms step:2940/7050 train_time:664111ms step_avg:225.89ms step:2941/7050 train_time:664344ms step_avg:225.89ms step:2942/7050 train_time:664578ms step_avg:225.89ms step:2943/7050 train_time:664810ms step_avg:225.90ms step:2944/7050 train_time:665043ms step_avg:225.90ms step:2945/7050 train_time:665276ms step_avg:225.90ms step:2946/7050 train_time:665508ms step_avg:225.90ms step:2947/7050 train_time:665740ms step_avg:225.90ms step:2948/7050 train_time:665972ms step_avg:225.91ms step:2949/7050 train_time:666206ms step_avg:225.91ms step:2950/7050 train_time:666438ms step_avg:225.91ms step:2951/7050 train_time:666672ms step_avg:225.91ms step:2952/7050 train_time:666904ms step_avg:225.92ms step:2953/7050 train_time:667135ms step_avg:225.92ms step:2954/7050 train_time:667368ms step_avg:225.92ms step:2955/7050 train_time:667601ms step_avg:225.92ms step:2956/7050 train_time:667835ms step_avg:225.93ms step:2957/7050 train_time:668067ms step_avg:225.93ms step:2958/7050 train_time:668300ms 
step_avg:225.93ms step:2959/7050 train_time:668531ms step_avg:225.93ms step:2960/7050 train_time:668764ms step_avg:225.93ms step:2961/7050 train_time:668997ms step_avg:225.94ms step:2962/7050 train_time:669231ms step_avg:225.94ms step:2963/7050 train_time:669464ms step_avg:225.94ms step:2964/7050 train_time:669697ms step_avg:225.94ms step:2965/7050 train_time:669930ms step_avg:225.95ms step:2966/7050 train_time:670163ms step_avg:225.95ms step:2967/7050 train_time:670395ms step_avg:225.95ms step:2968/7050 train_time:670628ms step_avg:225.95ms step:2969/7050 train_time:670861ms step_avg:225.96ms step:2970/7050 train_time:671094ms step_avg:225.96ms step:2971/7050 train_time:671326ms step_avg:225.96ms step:2972/7050 train_time:671559ms step_avg:225.96ms step:2973/7050 train_time:671792ms step_avg:225.96ms step:2974/7050 train_time:672024ms step_avg:225.97ms step:2975/7050 train_time:672257ms step_avg:225.97ms step:2976/7050 train_time:672490ms step_avg:225.97ms step:2977/7050 train_time:672722ms step_avg:225.97ms step:2978/7050 train_time:672954ms step_avg:225.98ms step:2979/7050 train_time:673185ms step_avg:225.98ms step:2980/7050 train_time:673948ms step_avg:226.16ms step:2981/7050 train_time:674180ms step_avg:226.16ms step:2982/7050 train_time:674409ms step_avg:226.16ms step:2983/7050 train_time:674639ms step_avg:226.16ms step:2984/7050 train_time:674875ms step_avg:226.16ms step:2985/7050 train_time:675110ms step_avg:226.17ms step:2986/7050 train_time:675340ms step_avg:226.17ms step:2987/7050 train_time:675571ms step_avg:226.17ms step:2988/7050 train_time:675803ms step_avg:226.17ms step:2989/7050 train_time:676038ms step_avg:226.18ms step:2990/7050 train_time:676270ms step_avg:226.18ms step:2991/7050 train_time:676504ms step_avg:226.18ms step:2992/7050 train_time:676736ms step_avg:226.18ms step:2993/7050 train_time:676969ms step_avg:226.18ms step:2994/7050 train_time:677202ms step_avg:226.19ms step:2995/7050 train_time:677436ms step_avg:226.19ms step:2996/7050 
train_time:677668ms step_avg:226.19ms step:2997/7050 train_time:677900ms step_avg:226.19ms step:2998/7050 train_time:678134ms step_avg:226.20ms step:2999/7050 train_time:678366ms step_avg:226.20ms step:3000/7050 train_time:678599ms step_avg:226.20ms step:3000/7050 val_loss:3.1670 train_time:678781ms step_avg:226.26ms step:3001/7050 train_time:678832ms step_avg:226.20ms step:3002/7050 train_time:679063ms step_avg:226.20ms step:3003/7050 train_time:679298ms step_avg:226.21ms step:3004/7050 train_time:679531ms step_avg:226.21ms step:3005/7050 train_time:679764ms step_avg:226.21ms step:3006/7050 train_time:679996ms step_avg:226.21ms step:3007/7050 train_time:680229ms step_avg:226.22ms step:3008/7050 train_time:680463ms step_avg:226.22ms step:3009/7050 train_time:680696ms step_avg:226.22ms step:3010/7050 train_time:680927ms step_avg:226.22ms step:3011/7050 train_time:681160ms step_avg:226.22ms step:3012/7050 train_time:681393ms step_avg:226.23ms step:3013/7050 train_time:681627ms step_avg:226.23ms step:3014/7050 train_time:681860ms step_avg:226.23ms step:3015/7050 train_time:682092ms step_avg:226.23ms step:3016/7050 train_time:682324ms step_avg:226.23ms step:3017/7050 train_time:682557ms step_avg:226.24ms step:3018/7050 train_time:682791ms step_avg:226.24ms step:3019/7050 train_time:683022ms step_avg:226.24ms step:3020/7050 train_time:683256ms step_avg:226.24ms step:3021/7050 train_time:683488ms step_avg:226.25ms step:3022/7050 train_time:683719ms step_avg:226.25ms step:3023/7050 train_time:683951ms step_avg:226.25ms step:3024/7050 train_time:684184ms step_avg:226.25ms step:3025/7050 train_time:684416ms step_avg:226.25ms step:3026/7050 train_time:684649ms step_avg:226.26ms step:3027/7050 train_time:684881ms step_avg:226.26ms step:3028/7050 train_time:685115ms step_avg:226.26ms step:3029/7050 train_time:685349ms step_avg:226.26ms step:3030/7050 train_time:685582ms step_avg:226.26ms step:3031/7050 train_time:685816ms step_avg:226.27ms step:3032/7050 train_time:686047ms 
step_avg:226.27ms step:3033/7050 train_time:686280ms step_avg:226.27ms step:3034/7050 train_time:686513ms step_avg:226.27ms step:3035/7050 train_time:686745ms step_avg:226.28ms step:3036/7050 train_time:686976ms step_avg:226.28ms step:3037/7050 train_time:687209ms step_avg:226.28ms step:3038/7050 train_time:687441ms step_avg:226.28ms step:3039/7050 train_time:687676ms step_avg:226.28ms step:3040/7050 train_time:687908ms step_avg:226.29ms step:3041/7050 train_time:688141ms step_avg:226.29ms step:3042/7050 train_time:688375ms step_avg:226.29ms step:3043/7050 train_time:688607ms step_avg:226.29ms step:3044/7050 train_time:688839ms step_avg:226.29ms step:3045/7050 train_time:689072ms step_avg:226.30ms step:3046/7050 train_time:689305ms step_avg:226.30ms step:3047/7050 train_time:689537ms step_avg:226.30ms step:3048/7050 train_time:689771ms step_avg:226.30ms step:3049/7050 train_time:690003ms step_avg:226.30ms step:3050/7050 train_time:690235ms step_avg:226.31ms step:3051/7050 train_time:690468ms step_avg:226.31ms step:3052/7050 train_time:690700ms step_avg:226.31ms step:3053/7050 train_time:690932ms step_avg:226.31ms step:3054/7050 train_time:691164ms step_avg:226.31ms step:3055/7050 train_time:691397ms step_avg:226.32ms step:3056/7050 train_time:691630ms step_avg:226.32ms step:3057/7050 train_time:691863ms step_avg:226.32ms step:3058/7050 train_time:692096ms step_avg:226.32ms step:3059/7050 train_time:692328ms step_avg:226.32ms step:3060/7050 train_time:692560ms step_avg:226.33ms step:3061/7050 train_time:692793ms step_avg:226.33ms step:3062/7050 train_time:693026ms step_avg:226.33ms step:3063/7050 train_time:693257ms step_avg:226.33ms step:3064/7050 train_time:693492ms step_avg:226.34ms step:3065/7050 train_time:693723ms step_avg:226.34ms step:3066/7050 train_time:693956ms step_avg:226.34ms step:3067/7050 train_time:694189ms step_avg:226.34ms step:3068/7050 train_time:694422ms step_avg:226.34ms step:3069/7050 train_time:694655ms step_avg:226.35ms step:3070/7050 
train_time:694890ms step_avg:226.35ms step:3071/7050 train_time:695121ms step_avg:226.35ms step:3072/7050 train_time:695354ms step_avg:226.35ms step:3073/7050 train_time:695587ms step_avg:226.35ms step:3074/7050 train_time:695819ms step_avg:226.36ms step:3075/7050 train_time:696051ms step_avg:226.36ms step:3076/7050 train_time:696283ms step_avg:226.36ms step:3077/7050 train_time:696514ms step_avg:226.36ms step:3078/7050 train_time:696747ms step_avg:226.36ms step:3079/7050 train_time:696981ms step_avg:226.37ms step:3080/7050 train_time:697213ms step_avg:226.37ms step:3081/7050 train_time:697443ms step_avg:226.37ms step:3082/7050 train_time:697678ms step_avg:226.37ms step:3083/7050 train_time:697912ms step_avg:226.37ms step:3084/7050 train_time:698144ms step_avg:226.38ms step:3085/7050 train_time:698377ms step_avg:226.38ms step:3086/7050 train_time:698613ms step_avg:226.38ms step:3087/7050 train_time:698846ms step_avg:226.38ms step:3088/7050 train_time:699079ms step_avg:226.39ms step:3089/7050 train_time:699312ms step_avg:226.39ms step:3090/7050 train_time:699545ms step_avg:226.39ms step:3091/7050 train_time:699777ms step_avg:226.39ms step:3092/7050 train_time:700011ms step_avg:226.39ms step:3093/7050 train_time:700243ms step_avg:226.40ms step:3094/7050 train_time:700479ms step_avg:226.40ms step:3095/7050 train_time:700714ms step_avg:226.40ms step:3096/7050 train_time:700946ms step_avg:226.40ms step:3097/7050 train_time:701181ms step_avg:226.41ms step:3098/7050 train_time:701414ms step_avg:226.41ms step:3099/7050 train_time:701646ms step_avg:226.41ms step:3100/7050 train_time:701879ms step_avg:226.41ms step:3101/7050 train_time:702112ms step_avg:226.41ms step:3102/7050 train_time:702343ms step_avg:226.42ms step:3103/7050 train_time:702577ms step_avg:226.42ms step:3104/7050 train_time:702808ms step_avg:226.42ms step:3105/7050 train_time:703042ms step_avg:226.42ms step:3106/7050 train_time:703276ms step_avg:226.43ms step:3107/7050 train_time:703508ms step_avg:226.43ms 
step:3108/7050 train_time:703741ms step_avg:226.43ms step:3109/7050 train_time:703974ms step_avg:226.43ms step:3110/7050 train_time:704207ms step_avg:226.43ms step:3111/7050 train_time:704438ms step_avg:226.43ms step:3112/7050 train_time:704670ms step_avg:226.44ms step:3113/7050 train_time:704903ms step_avg:226.44ms step:3114/7050 train_time:705134ms step_avg:226.44ms step:3115/7050 train_time:705366ms step_avg:226.44ms step:3116/7050 train_time:705599ms step_avg:226.44ms step:3117/7050 train_time:705832ms step_avg:226.45ms step:3118/7050 train_time:706065ms step_avg:226.45ms step:3119/7050 train_time:706299ms step_avg:226.45ms step:3120/7050 train_time:706531ms step_avg:226.45ms step:3121/7050 train_time:706765ms step_avg:226.45ms step:3122/7050 train_time:706998ms step_avg:226.46ms step:3123/7050 train_time:707229ms step_avg:226.46ms step:3124/7050 train_time:707463ms step_avg:226.46ms step:3125/7050 train_time:707697ms step_avg:226.46ms step:3125/7050 val_loss:3.1598 train_time:707879ms step_avg:226.52ms step:3126/7050 train_time:707929ms step_avg:226.46ms step:3127/7050 train_time:708163ms step_avg:226.47ms step:3128/7050 train_time:708397ms step_avg:226.47ms step:3129/7050 train_time:708629ms step_avg:226.47ms step:3130/7050 train_time:708860ms step_avg:226.47ms step:3131/7050 train_time:709091ms step_avg:226.47ms step:3132/7050 train_time:709325ms step_avg:226.48ms step:3133/7050 train_time:709558ms step_avg:226.48ms step:3134/7050 train_time:709790ms step_avg:226.48ms step:3135/7050 train_time:710023ms step_avg:226.48ms step:3136/7050 train_time:710255ms step_avg:226.48ms step:3137/7050 train_time:710489ms step_avg:226.49ms step:3138/7050 train_time:710721ms step_avg:226.49ms step:3139/7050 train_time:710954ms step_avg:226.49ms step:3140/7050 train_time:711186ms step_avg:226.49ms step:3141/7050 train_time:711420ms step_avg:226.49ms step:3142/7050 train_time:711653ms step_avg:226.50ms step:3143/7050 train_time:711887ms step_avg:226.50ms step:3144/7050 
train_time:712120ms step_avg:226.50ms step:3145/7050 train_time:712352ms step_avg:226.50ms step:3146/7050 train_time:712585ms step_avg:226.51ms step:3147/7050 train_time:712819ms step_avg:226.51ms step:3148/7050 train_time:713053ms step_avg:226.51ms step:3149/7050 train_time:713286ms step_avg:226.51ms step:3150/7050 train_time:713519ms step_avg:226.51ms step:3151/7050 train_time:713751ms step_avg:226.52ms step:3152/7050 train_time:713986ms step_avg:226.52ms step:3153/7050 train_time:714219ms step_avg:226.52ms step:3154/7050 train_time:714452ms step_avg:226.52ms step:3155/7050 train_time:714685ms step_avg:226.52ms step:3156/7050 train_time:714919ms step_avg:226.53ms step:3157/7050 train_time:715152ms step_avg:226.53ms step:3158/7050 train_time:715386ms step_avg:226.53ms step:3159/7050 train_time:715620ms step_avg:226.53ms step:3160/7050 train_time:715852ms step_avg:226.54ms step:3161/7050 train_time:716086ms step_avg:226.54ms step:3162/7050 train_time:716318ms step_avg:226.54ms step:3163/7050 train_time:716552ms step_avg:226.54ms step:3164/7050 train_time:716786ms step_avg:226.54ms step:3165/7050 train_time:717019ms step_avg:226.55ms step:3166/7050 train_time:717251ms step_avg:226.55ms step:3167/7050 train_time:717485ms step_avg:226.55ms step:3168/7050 train_time:717718ms step_avg:226.55ms step:3169/7050 train_time:717950ms step_avg:226.55ms step:3170/7050 train_time:718183ms step_avg:226.56ms step:3171/7050 train_time:718415ms step_avg:226.56ms step:3172/7050 train_time:718648ms step_avg:226.56ms step:3173/7050 train_time:718883ms step_avg:226.56ms step:3174/7050 train_time:719116ms step_avg:226.56ms step:3175/7050 train_time:719349ms step_avg:226.57ms step:3176/7050 train_time:719582ms step_avg:226.57ms step:3177/7050 train_time:719814ms step_avg:226.57ms step:3178/7050 train_time:720048ms step_avg:226.57ms step:3179/7050 train_time:720283ms step_avg:226.58ms step:3180/7050 train_time:720515ms step_avg:226.58ms step:3181/7050 train_time:720748ms step_avg:226.58ms 
step:3182/7050 train_time:720981ms step_avg:226.58ms step:3183/7050 train_time:721213ms step_avg:226.58ms step:3184/7050 train_time:721446ms step_avg:226.58ms step:3185/7050 train_time:721679ms step_avg:226.59ms step:3186/7050 train_time:721911ms step_avg:226.59ms step:3187/7050 train_time:722145ms step_avg:226.59ms step:3188/7050 train_time:722379ms step_avg:226.59ms step:3189/7050 train_time:722612ms step_avg:226.60ms step:3190/7050 train_time:722845ms step_avg:226.60ms step:3191/7050 train_time:723078ms step_avg:226.60ms step:3192/7050 train_time:723312ms step_avg:226.60ms step:3193/7050 train_time:723546ms step_avg:226.60ms step:3194/7050 train_time:723778ms step_avg:226.61ms step:3195/7050 train_time:724013ms step_avg:226.61ms step:3196/7050 train_time:724245ms step_avg:226.61ms step:3197/7050 train_time:724479ms step_avg:226.61ms step:3198/7050 train_time:724712ms step_avg:226.61ms step:3199/7050 train_time:724947ms step_avg:226.62ms step:3200/7050 train_time:725180ms step_avg:226.62ms step:3201/7050 train_time:725417ms step_avg:226.62ms step:3202/7050 train_time:725651ms step_avg:226.62ms step:3203/7050 train_time:725885ms step_avg:226.63ms step:3204/7050 train_time:726118ms step_avg:226.63ms step:3205/7050 train_time:726351ms step_avg:226.63ms step:3206/7050 train_time:726586ms step_avg:226.63ms step:3207/7050 train_time:726818ms step_avg:226.64ms step:3208/7050 train_time:727053ms step_avg:226.64ms step:3209/7050 train_time:727287ms step_avg:226.64ms step:3210/7050 train_time:727520ms step_avg:226.64ms step:3211/7050 train_time:727751ms step_avg:226.64ms step:3212/7050 train_time:727985ms step_avg:226.65ms step:3213/7050 train_time:728220ms step_avg:226.65ms step:3214/7050 train_time:728454ms step_avg:226.65ms step:3215/7050 train_time:728686ms step_avg:226.65ms step:3216/7050 train_time:728918ms step_avg:226.65ms step:3217/7050 train_time:729150ms step_avg:226.66ms step:3218/7050 train_time:729384ms step_avg:226.66ms step:3219/7050 train_time:729617ms 
step_avg:226.66ms step:3220/7050 train_time:729850ms step_avg:226.66ms step:3221/7050 train_time:730085ms step_avg:226.66ms step:3222/7050 train_time:730318ms step_avg:226.67ms step:3223/7050 train_time:730549ms step_avg:226.67ms step:3224/7050 train_time:730786ms step_avg:226.67ms step:3225/7050 train_time:731018ms step_avg:226.67ms step:3226/7050 train_time:731250ms step_avg:226.67ms step:3227/7050 train_time:731484ms step_avg:226.68ms step:3228/7050 train_time:731716ms step_avg:226.68ms step:3229/7050 train_time:731950ms step_avg:226.68ms step:3230/7050 train_time:732185ms step_avg:226.68ms step:3231/7050 train_time:732418ms step_avg:226.68ms step:3232/7050 train_time:732652ms step_avg:226.69ms step:3233/7050 train_time:732884ms step_avg:226.69ms step:3234/7050 train_time:733116ms step_avg:226.69ms step:3235/7050 train_time:733349ms step_avg:226.69ms step:3236/7050 train_time:733583ms step_avg:226.69ms step:3237/7050 train_time:733816ms step_avg:226.70ms step:3238/7050 train_time:734049ms step_avg:226.70ms step:3239/7050 train_time:734283ms step_avg:226.70ms step:3240/7050 train_time:734516ms step_avg:226.70ms step:3241/7050 train_time:734749ms step_avg:226.70ms step:3242/7050 train_time:734983ms step_avg:226.71ms step:3243/7050 train_time:735216ms step_avg:226.71ms step:3244/7050 train_time:735449ms step_avg:226.71ms step:3245/7050 train_time:735684ms step_avg:226.71ms step:3246/7050 train_time:735916ms step_avg:226.71ms step:3247/7050 train_time:736150ms step_avg:226.72ms step:3248/7050 train_time:736382ms step_avg:226.72ms step:3249/7050 train_time:736615ms step_avg:226.72ms step:3250/7050 train_time:736847ms step_avg:226.72ms step:3250/7050 val_loss:3.1471 train_time:737032ms step_avg:226.78ms step:3251/7050 train_time:737082ms step_avg:226.72ms step:3252/7050 train_time:737315ms step_avg:226.73ms step:3253/7050 train_time:737555ms step_avg:226.73ms step:3254/7050 train_time:737788ms step_avg:226.73ms step:3255/7050 train_time:738019ms step_avg:226.73ms 
step:3256/7050 train_time:738249ms step_avg:226.74ms step:3257/7050 train_time:738483ms step_avg:226.74ms step:3258/7050 train_time:738718ms step_avg:226.74ms step:3259/7050 train_time:738951ms step_avg:226.74ms step:3260/7050 train_time:739183ms step_avg:226.74ms step:3261/7050 train_time:739417ms step_avg:226.75ms step:3262/7050 train_time:739654ms step_avg:226.75ms step:3263/7050 train_time:739887ms step_avg:226.75ms step:3264/7050 train_time:740121ms step_avg:226.75ms step:3265/7050 train_time:740353ms step_avg:226.75ms step:3266/7050 train_time:740586ms step_avg:226.76ms step:3267/7050 train_time:740820ms step_avg:226.76ms step:3268/7050 train_time:741054ms step_avg:226.76ms step:3269/7050 train_time:741286ms step_avg:226.76ms step:3270/7050 train_time:741519ms step_avg:226.76ms step:3271/7050 train_time:741755ms step_avg:226.77ms step:3272/7050 train_time:741986ms step_avg:226.77ms step:3273/7050 train_time:742219ms step_avg:226.77ms step:3274/7050 train_time:742453ms step_avg:226.77ms step:3275/7050 train_time:742685ms step_avg:226.77ms step:3276/7050 train_time:742919ms step_avg:226.78ms step:3277/7050 train_time:743154ms step_avg:226.78ms step:3278/7050 train_time:743387ms step_avg:226.78ms step:3279/7050 train_time:743620ms step_avg:226.78ms step:3280/7050 train_time:743854ms step_avg:226.78ms step:3281/7050 train_time:744088ms step_avg:226.79ms step:3282/7050 train_time:744322ms step_avg:226.79ms step:3283/7050 train_time:744555ms step_avg:226.79ms step:3284/7050 train_time:744787ms step_avg:226.79ms step:3285/7050 train_time:745021ms step_avg:226.79ms step:3286/7050 train_time:745254ms step_avg:226.80ms step:3287/7050 train_time:745489ms step_avg:226.80ms step:3288/7050 train_time:745722ms step_avg:226.80ms step:3289/7050 train_time:745955ms step_avg:226.80ms step:3290/7050 train_time:746188ms step_avg:226.80ms step:3291/7050 train_time:746422ms step_avg:226.81ms step:3292/7050 train_time:746656ms step_avg:226.81ms step:3293/7050 train_time:746892ms 
step_avg:226.81ms step:3294/7050 train_time:747125ms step_avg:226.81ms step:3295/7050 train_time:747359ms step_avg:226.82ms step:3296/7050 train_time:747592ms step_avg:226.82ms step:3297/7050 train_time:747825ms step_avg:226.82ms step:3298/7050 train_time:748059ms step_avg:226.82ms step:3299/7050 train_time:748292ms step_avg:226.82ms step:3300/7050 train_time:748525ms step_avg:226.83ms step:3301/7050 train_time:748761ms step_avg:226.83ms step:3302/7050 train_time:748996ms step_avg:226.83ms step:3303/7050 train_time:749228ms step_avg:226.83ms step:3304/7050 train_time:749461ms step_avg:226.83ms step:3305/7050 train_time:749695ms step_avg:226.84ms step:3306/7050 train_time:749929ms step_avg:226.84ms step:3307/7050 train_time:750162ms step_avg:226.84ms step:3308/7050 train_time:750396ms step_avg:226.84ms step:3309/7050 train_time:750630ms step_avg:226.84ms step:3310/7050 train_time:750862ms step_avg:226.85ms step:3311/7050 train_time:751097ms step_avg:226.85ms step:3312/7050 train_time:751330ms step_avg:226.85ms step:3313/7050 train_time:751563ms step_avg:226.85ms step:3314/7050 train_time:751799ms step_avg:226.86ms step:3315/7050 train_time:752031ms step_avg:226.86ms step:3316/7050 train_time:752264ms step_avg:226.86ms step:3317/7050 train_time:752496ms step_avg:226.86ms step:3318/7050 train_time:752730ms step_avg:226.86ms step:3319/7050 train_time:752963ms step_avg:226.86ms step:3320/7050 train_time:753196ms step_avg:226.87ms step:3321/7050 train_time:753428ms step_avg:226.87ms step:3322/7050 train_time:753663ms step_avg:226.87ms step:3323/7050 train_time:753897ms step_avg:226.87ms step:3324/7050 train_time:754131ms step_avg:226.87ms step:3325/7050 train_time:754363ms step_avg:226.88ms step:3326/7050 train_time:754599ms step_avg:226.88ms step:3327/7050 train_time:754832ms step_avg:226.88ms step:3328/7050 train_time:755065ms step_avg:226.88ms step:3329/7050 train_time:755300ms step_avg:226.88ms step:3330/7050 train_time:755533ms step_avg:226.89ms step:3331/7050 
train_time:755767ms step_avg:226.89ms step:3332/7050 train_time:755999ms step_avg:226.89ms step:3333/7050 train_time:756232ms step_avg:226.89ms step:3334/7050 train_time:756465ms step_avg:226.89ms step:3335/7050 train_time:756700ms step_avg:226.90ms step:3336/7050 train_time:756933ms step_avg:226.90ms step:3337/7050 train_time:757167ms step_avg:226.90ms step:3338/7050 train_time:757402ms step_avg:226.90ms step:3339/7050 train_time:757634ms step_avg:226.90ms step:3340/7050 train_time:757868ms step_avg:226.91ms step:3341/7050 train_time:758100ms step_avg:226.91ms step:3342/7050 train_time:758332ms step_avg:226.91ms step:3343/7050 train_time:758564ms step_avg:226.91ms step:3344/7050 train_time:758797ms step_avg:226.91ms step:3345/7050 train_time:759030ms step_avg:226.91ms step:3346/7050 train_time:759263ms step_avg:226.92ms step:3347/7050 train_time:759498ms step_avg:226.92ms step:3348/7050 train_time:759731ms step_avg:226.92ms step:3349/7050 train_time:759965ms step_avg:226.92ms step:3350/7050 train_time:760198ms step_avg:226.92ms step:3351/7050 train_time:760432ms step_avg:226.93ms step:3352/7050 train_time:760664ms step_avg:226.93ms step:3353/7050 train_time:760899ms step_avg:226.93ms step:3354/7050 train_time:761132ms step_avg:226.93ms step:3355/7050 train_time:761363ms step_avg:226.93ms step:3356/7050 train_time:761598ms step_avg:226.94ms step:3357/7050 train_time:761832ms step_avg:226.94ms step:3358/7050 train_time:762066ms step_avg:226.94ms step:3359/7050 train_time:762299ms step_avg:226.94ms step:3360/7050 train_time:762533ms step_avg:226.94ms step:3361/7050 train_time:762766ms step_avg:226.95ms step:3362/7050 train_time:763000ms step_avg:226.95ms step:3363/7050 train_time:763234ms step_avg:226.95ms step:3364/7050 train_time:763468ms step_avg:226.95ms step:3365/7050 train_time:763701ms step_avg:226.95ms step:3366/7050 train_time:763935ms step_avg:226.96ms step:3367/7050 train_time:764168ms step_avg:226.96ms step:3368/7050 train_time:764401ms step_avg:226.96ms 
step:3369/7050 train_time:764634ms step_avg:226.96ms step:3370/7050 train_time:764868ms step_avg:226.96ms step:3371/7050 train_time:765101ms step_avg:226.97ms step:3372/7050 train_time:765335ms step_avg:226.97ms step:3373/7050 train_time:765567ms step_avg:226.97ms step:3374/7050 train_time:765800ms step_avg:226.97ms step:3375/7050 train_time:766034ms step_avg:226.97ms step:3375/7050 val_loss:3.1413 train_time:766218ms step_avg:227.03ms step:3376/7050 train_time:766268ms step_avg:226.98ms step:3377/7050 train_time:766499ms step_avg:226.98ms step:3378/7050 train_time:766738ms step_avg:226.98ms step:3379/7050 train_time:766975ms step_avg:226.98ms step:3380/7050 train_time:767208ms step_avg:226.98ms step:3381/7050 train_time:767441ms step_avg:226.99ms step:3382/7050 train_time:767676ms step_avg:226.99ms step:3383/7050 train_time:767911ms step_avg:226.99ms step:3384/7050 train_time:768143ms step_avg:226.99ms step:3385/7050 train_time:768375ms step_avg:226.99ms step:3386/7050 train_time:768610ms step_avg:227.00ms step:3387/7050 train_time:768844ms step_avg:227.00ms step:3388/7050 train_time:769075ms step_avg:227.00ms step:3389/7050 train_time:769309ms step_avg:227.00ms step:3390/7050 train_time:769542ms step_avg:227.00ms step:3391/7050 train_time:769777ms step_avg:227.01ms step:3392/7050 train_time:770010ms step_avg:227.01ms step:3393/7050 train_time:770243ms step_avg:227.01ms step:3394/7050 train_time:770475ms step_avg:227.01ms step:3395/7050 train_time:770708ms step_avg:227.01ms step:3396/7050 train_time:770943ms step_avg:227.02ms step:3397/7050 train_time:771177ms step_avg:227.02ms step:3398/7050 train_time:771410ms step_avg:227.02ms step:3399/7050 train_time:771644ms step_avg:227.02ms step:3400/7050 train_time:771877ms step_avg:227.02ms step:3401/7050 train_time:772108ms step_avg:227.02ms step:3402/7050 train_time:772344ms step_avg:227.03ms step:3403/7050 train_time:772575ms step_avg:227.03ms step:3404/7050 train_time:772810ms step_avg:227.03ms step:3405/7050 
train_time:773043ms step_avg:227.03ms step:3406/7050 train_time:773274ms step_avg:227.03ms step:3407/7050 train_time:773506ms step_avg:227.03ms step:3408/7050 train_time:773741ms step_avg:227.04ms step:3409/7050 train_time:773973ms step_avg:227.04ms step:3410/7050 train_time:774208ms step_avg:227.04ms step:3411/7050 train_time:774441ms step_avg:227.04ms step:3412/7050 train_time:774675ms step_avg:227.04ms step:3413/7050 train_time:774909ms step_avg:227.05ms step:3414/7050 train_time:775144ms step_avg:227.05ms step:3415/7050 train_time:775379ms step_avg:227.05ms step:3416/7050 train_time:775612ms step_avg:227.05ms step:3417/7050 train_time:775844ms step_avg:227.05ms step:3418/7050 train_time:776080ms step_avg:227.06ms step:3419/7050 train_time:776313ms step_avg:227.06ms step:3420/7050 train_time:776548ms step_avg:227.06ms step:3421/7050 train_time:776781ms step_avg:227.06ms step:3422/7050 train_time:777014ms step_avg:227.06ms step:3423/7050 train_time:777247ms step_avg:227.07ms step:3424/7050 train_time:777483ms step_avg:227.07ms step:3425/7050 train_time:777716ms step_avg:227.07ms step:3426/7050 train_time:777948ms step_avg:227.07ms step:3427/7050 train_time:778183ms step_avg:227.07ms step:3428/7050 train_time:778415ms step_avg:227.08ms step:3429/7050 train_time:778648ms step_avg:227.08ms step:3430/7050 train_time:778881ms step_avg:227.08ms step:3431/7050 train_time:779114ms step_avg:227.08ms step:3432/7050 train_time:779346ms step_avg:227.08ms step:3433/7050 train_time:779579ms step_avg:227.08ms step:3434/7050 train_time:779810ms step_avg:227.09ms step:3435/7050 train_time:780043ms step_avg:227.09ms step:3436/7050 train_time:780279ms step_avg:227.09ms step:3437/7050 train_time:780511ms step_avg:227.09ms step:3438/7050 train_time:780743ms step_avg:227.09ms step:3439/7050 train_time:780976ms step_avg:227.09ms step:3440/7050 train_time:781210ms step_avg:227.10ms step:3441/7050 train_time:781443ms step_avg:227.10ms step:3442/7050 train_time:781675ms step_avg:227.10ms 
step:3443/7050 train_time:781908ms step_avg:227.10ms step:3444/7050 train_time:782144ms step_avg:227.10ms step:3445/7050 train_time:782377ms step_avg:227.11ms step:3446/7050 train_time:782612ms step_avg:227.11ms step:3447/7050 train_time:782845ms step_avg:227.11ms step:3448/7050 train_time:783077ms step_avg:227.11ms step:3449/7050 train_time:783311ms step_avg:227.11ms step:3450/7050 train_time:783544ms step_avg:227.11ms step:3451/7050 train_time:783778ms step_avg:227.12ms step:3452/7050 train_time:784010ms step_avg:227.12ms step:3453/7050 train_time:784248ms step_avg:227.12ms step:3454/7050 train_time:784480ms step_avg:227.12ms step:3455/7050 train_time:784711ms step_avg:227.12ms step:3456/7050 train_time:784944ms step_avg:227.12ms step:3457/7050 train_time:785178ms step_avg:227.13ms step:3458/7050 train_time:785411ms step_avg:227.13ms step:3459/7050 train_time:785644ms step_avg:227.13ms step:3460/7050 train_time:785877ms step_avg:227.13ms step:3461/7050 train_time:786112ms step_avg:227.13ms step:3462/7050 train_time:786345ms step_avg:227.14ms step:3463/7050 train_time:786579ms step_avg:227.14ms step:3464/7050 train_time:786812ms step_avg:227.14ms step:3465/7050 train_time:787045ms step_avg:227.14ms step:3466/7050 train_time:787277ms step_avg:227.14ms step:3467/7050 train_time:787512ms step_avg:227.15ms step:3468/7050 train_time:787746ms step_avg:227.15ms step:3469/7050 train_time:787981ms step_avg:227.15ms step:3470/7050 train_time:788214ms step_avg:227.15ms step:3471/7050 train_time:788448ms step_avg:227.15ms step:3472/7050 train_time:788682ms step_avg:227.15ms step:3473/7050 train_time:788914ms step_avg:227.16ms step:3474/7050 train_time:789149ms step_avg:227.16ms step:3475/7050 train_time:789384ms step_avg:227.16ms step:3476/7050 train_time:789618ms step_avg:227.16ms step:3477/7050 train_time:789853ms step_avg:227.16ms step:3478/7050 train_time:790086ms step_avg:227.17ms step:3479/7050 train_time:790320ms step_avg:227.17ms step:3480/7050 train_time:790554ms 
step_avg:227.17ms step:3481/7050 train_time:790789ms step_avg:227.17ms step:3482/7050 train_time:791021ms step_avg:227.17ms step:3483/7050 train_time:791253ms step_avg:227.18ms step:3484/7050 train_time:791486ms step_avg:227.18ms step:3485/7050 train_time:791719ms step_avg:227.18ms step:3486/7050 train_time:791952ms step_avg:227.18ms step:3487/7050 train_time:792186ms step_avg:227.18ms step:3488/7050 train_time:792421ms step_avg:227.18ms step:3489/7050 train_time:792653ms step_avg:227.19ms step:3490/7050 train_time:792886ms step_avg:227.19ms step:3491/7050 train_time:793119ms step_avg:227.19ms step:3492/7050 train_time:793354ms step_avg:227.19ms step:3493/7050 train_time:793586ms step_avg:227.19ms step:3494/7050 train_time:793819ms step_avg:227.19ms step:3495/7050 train_time:794053ms step_avg:227.20ms step:3496/7050 train_time:794287ms step_avg:227.20ms step:3497/7050 train_time:794519ms step_avg:227.20ms step:3498/7050 train_time:794752ms step_avg:227.20ms step:3499/7050 train_time:794986ms step_avg:227.20ms step:3500/7050 train_time:795218ms step_avg:227.21ms step:3500/7050 val_loss:3.1367 train_time:795403ms step_avg:227.26ms step:3501/7050 train_time:795453ms step_avg:227.21ms step:3502/7050 train_time:795686ms step_avg:227.21ms step:3503/7050 train_time:795924ms step_avg:227.21ms step:3504/7050 train_time:796158ms step_avg:227.21ms step:3505/7050 train_time:796391ms step_avg:227.22ms step:3506/7050 train_time:796622ms step_avg:227.22ms step:3507/7050 train_time:796860ms step_avg:227.22ms step:3508/7050 train_time:797094ms step_avg:227.22ms step:3509/7050 train_time:797326ms step_avg:227.22ms step:3510/7050 train_time:797559ms step_avg:227.22ms step:3511/7050 train_time:797794ms step_avg:227.23ms step:3512/7050 train_time:798029ms step_avg:227.23ms step:3513/7050 train_time:798262ms step_avg:227.23ms step:3514/7050 train_time:798495ms step_avg:227.23ms step:3515/7050 train_time:798729ms step_avg:227.23ms step:3516/7050 train_time:798965ms step_avg:227.24ms 
step:3517/7050 train_time:799198ms step_avg:227.24ms step:3518/7050 train_time:799430ms step_avg:227.24ms step:3519/7050 train_time:799664ms step_avg:227.24ms step:3520/7050 train_time:799897ms step_avg:227.24ms step:3521/7050 train_time:800130ms step_avg:227.25ms step:3522/7050 train_time:800364ms step_avg:227.25ms step:3523/7050 train_time:800597ms step_avg:227.25ms step:3524/7050 train_time:800832ms step_avg:227.25ms step:3525/7050 train_time:801067ms step_avg:227.25ms step:3526/7050 train_time:801301ms step_avg:227.25ms step:3527/7050 train_time:801532ms step_avg:227.26ms step:3528/7050 train_time:801765ms step_avg:227.26ms step:3529/7050 train_time:802000ms step_avg:227.26ms step:3530/7050 train_time:802233ms step_avg:227.26ms step:3531/7050 train_time:802467ms step_avg:227.26ms step:3532/7050 train_time:802700ms step_avg:227.27ms step:3533/7050 train_time:802935ms step_avg:227.27ms step:3534/7050 train_time:803169ms step_avg:227.27ms step:3535/7050 train_time:803402ms step_avg:227.27ms step:3536/7050 train_time:803635ms step_avg:227.27ms step:3537/7050 train_time:803869ms step_avg:227.27ms step:3538/7050 train_time:804100ms step_avg:227.28ms step:3539/7050 train_time:804333ms step_avg:227.28ms step:3540/7050 train_time:804568ms step_avg:227.28ms step:3541/7050 train_time:804800ms step_avg:227.28ms step:3542/7050 train_time:805035ms step_avg:227.28ms step:3543/7050 train_time:805267ms step_avg:227.28ms step:3544/7050 train_time:805501ms step_avg:227.29ms step:3545/7050 train_time:805735ms step_avg:227.29ms step:3546/7050 train_time:805972ms step_avg:227.29ms step:3547/7050 train_time:806205ms step_avg:227.29ms step:3548/7050 train_time:806440ms step_avg:227.29ms step:3549/7050 train_time:806671ms step_avg:227.30ms step:3550/7050 train_time:806904ms step_avg:227.30ms step:3551/7050 train_time:807138ms step_avg:227.30ms step:3552/7050 train_time:807373ms step_avg:227.30ms step:3553/7050 train_time:807609ms step_avg:227.30ms step:3554/7050 train_time:807842ms 
step_avg:227.31ms step:3555/7050 train_time:808074ms step_avg:227.31ms step:3556/7050 train_time:808310ms step_avg:227.31ms step:3557/7050 train_time:808546ms step_avg:227.31ms step:3558/7050 train_time:808779ms step_avg:227.31ms step:3559/7050 train_time:809014ms step_avg:227.32ms step:3560/7050 train_time:809246ms step_avg:227.32ms step:3561/7050 train_time:809480ms step_avg:227.32ms step:3562/7050 train_time:809713ms step_avg:227.32ms step:3563/7050 train_time:809946ms step_avg:227.32ms step:3564/7050 train_time:810178ms step_avg:227.32ms step:3565/7050 train_time:810411ms step_avg:227.32ms step:3566/7050 train_time:810647ms step_avg:227.33ms step:3567/7050 train_time:810880ms step_avg:227.33ms step:3568/7050 train_time:811113ms step_avg:227.33ms step:3569/7050 train_time:811348ms step_avg:227.33ms step:3570/7050 train_time:811581ms step_avg:227.33ms step:3571/7050 train_time:811813ms step_avg:227.33ms step:3572/7050 train_time:812047ms step_avg:227.34ms step:3573/7050 train_time:812279ms step_avg:227.34ms step:3574/7050 train_time:812514ms step_avg:227.34ms step:3575/7050 train_time:812748ms step_avg:227.34ms step:3576/7050 train_time:812980ms step_avg:227.34ms step:3577/7050 train_time:813213ms step_avg:227.34ms step:3578/7050 train_time:813445ms step_avg:227.35ms step:3579/7050 train_time:813679ms step_avg:227.35ms step:3580/7050 train_time:813911ms step_avg:227.35ms step:3581/7050 train_time:814145ms step_avg:227.35ms step:3582/7050 train_time:814379ms step_avg:227.35ms step:3583/7050 train_time:814612ms step_avg:227.35ms step:3584/7050 train_time:814845ms step_avg:227.36ms step:3585/7050 train_time:815078ms step_avg:227.36ms step:3586/7050 train_time:815311ms step_avg:227.36ms step:3587/7050 train_time:815544ms step_avg:227.36ms step:3588/7050 train_time:815778ms step_avg:227.36ms step:3589/7050 train_time:816011ms step_avg:227.36ms step:3590/7050 train_time:816243ms step_avg:227.37ms step:3591/7050 train_time:816475ms step_avg:227.37ms step:3592/7050 
train_time:816709ms step_avg:227.37ms step:3593/7050 train_time:816942ms step_avg:227.37ms step:3594/7050 train_time:817175ms step_avg:227.37ms step:3595/7050 train_time:817409ms step_avg:227.37ms step:3596/7050 train_time:817642ms step_avg:227.38ms step:3597/7050 train_time:817875ms step_avg:227.38ms step:3598/7050 train_time:818110ms step_avg:227.38ms step:3599/7050 train_time:818343ms step_avg:227.38ms step:3600/7050 train_time:818575ms step_avg:227.38ms step:3601/7050 train_time:818809ms step_avg:227.38ms step:3602/7050 train_time:819044ms step_avg:227.39ms step:3603/7050 train_time:819275ms step_avg:227.39ms step:3604/7050 train_time:819509ms step_avg:227.39ms step:3605/7050 train_time:819741ms step_avg:227.39ms step:3606/7050 train_time:819976ms step_avg:227.39ms step:3607/7050 train_time:820211ms step_avg:227.39ms step:3608/7050 train_time:820445ms step_avg:227.40ms step:3609/7050 train_time:820678ms step_avg:227.40ms step:3610/7050 train_time:820910ms step_avg:227.40ms step:3611/7050 train_time:821143ms step_avg:227.40ms step:3612/7050 train_time:821377ms step_avg:227.40ms step:3613/7050 train_time:821609ms step_avg:227.40ms step:3614/7050 train_time:821842ms step_avg:227.41ms step:3615/7050 train_time:822075ms step_avg:227.41ms step:3616/7050 train_time:822309ms step_avg:227.41ms step:3617/7050 train_time:822541ms step_avg:227.41ms step:3618/7050 train_time:822774ms step_avg:227.41ms step:3619/7050 train_time:823007ms step_avg:227.41ms step:3620/7050 train_time:823241ms step_avg:227.41ms step:3621/7050 train_time:823476ms step_avg:227.42ms step:3622/7050 train_time:823709ms step_avg:227.42ms step:3623/7050 train_time:823941ms step_avg:227.42ms step:3624/7050 train_time:824175ms step_avg:227.42ms step:3625/7050 train_time:824409ms step_avg:227.42ms step:3625/7050 val_loss:3.1313 train_time:824596ms step_avg:227.47ms step:3626/7050 train_time:824647ms step_avg:227.43ms step:3627/7050 train_time:824878ms step_avg:227.43ms step:3628/7050 train_time:825115ms 
step_avg:227.43ms step:3629/7050 train_time:825348ms step_avg:227.43ms step:3630/7050 train_time:825579ms step_avg:227.43ms step:3631/7050 train_time:825810ms step_avg:227.43ms step:3632/7050 train_time:826044ms step_avg:227.44ms step:3633/7050 train_time:826278ms step_avg:227.44ms step:3634/7050 train_time:826510ms step_avg:227.44ms step:3635/7050 train_time:826743ms step_avg:227.44ms step:3636/7050 train_time:826975ms step_avg:227.44ms step:3637/7050 train_time:827210ms step_avg:227.44ms step:3638/7050 train_time:827442ms step_avg:227.44ms step:3639/7050 train_time:827674ms step_avg:227.45ms step:3640/7050 train_time:827907ms step_avg:227.45ms step:3641/7050 train_time:828143ms step_avg:227.45ms step:3642/7050 train_time:828380ms step_avg:227.45ms step:3643/7050 train_time:828614ms step_avg:227.45ms step:3644/7050 train_time:828848ms step_avg:227.46ms step:3645/7050 train_time:829081ms step_avg:227.46ms step:3646/7050 train_time:829314ms step_avg:227.46ms step:3647/7050 train_time:829546ms step_avg:227.46ms step:3648/7050 train_time:829779ms step_avg:227.46ms step:3649/7050 train_time:830011ms step_avg:227.46ms step:3650/7050 train_time:830245ms step_avg:227.46ms step:3651/7050 train_time:830480ms step_avg:227.47ms step:3652/7050 train_time:830712ms step_avg:227.47ms step:3653/7050 train_time:830945ms step_avg:227.47ms step:3654/7050 train_time:831177ms step_avg:227.47ms step:3655/7050 train_time:831411ms step_avg:227.47ms step:3656/7050 train_time:831646ms step_avg:227.47ms step:3657/7050 train_time:831881ms step_avg:227.48ms step:3658/7050 train_time:832117ms step_avg:227.48ms step:3659/7050 train_time:832354ms step_avg:227.48ms step:3660/7050 train_time:832590ms step_avg:227.48ms step:3661/7050 train_time:832827ms step_avg:227.49ms step:3662/7050 train_time:833065ms step_avg:227.49ms step:3663/7050 train_time:833301ms step_avg:227.49ms step:3664/7050 train_time:833538ms step_avg:227.49ms step:3665/7050 train_time:833773ms step_avg:227.50ms step:3666/7050 
train_time:834010ms step_avg:227.50ms step:3667/7050 train_time:834246ms step_avg:227.50ms step:3668/7050 train_time:834482ms step_avg:227.50ms step:3669/7050 train_time:834718ms step_avg:227.51ms step:3670/7050 train_time:834954ms step_avg:227.51ms step:3671/7050 train_time:835192ms step_avg:227.51ms step:3672/7050 train_time:835432ms step_avg:227.51ms step:3673/7050 train_time:835668ms step_avg:227.52ms step:3674/7050 train_time:835903ms step_avg:227.52ms step:3675/7050 train_time:836140ms step_avg:227.52ms step:3676/7050 train_time:836378ms step_avg:227.52ms step:3677/7050 train_time:836613ms step_avg:227.53ms step:3678/7050 train_time:836849ms step_avg:227.53ms step:3679/7050 train_time:837084ms step_avg:227.53ms step:3680/7050 train_time:837320ms step_avg:227.53ms step:3681/7050 train_time:837556ms step_avg:227.53ms step:3682/7050 train_time:837793ms step_avg:227.54ms step:3683/7050 train_time:838029ms step_avg:227.54ms step:3684/7050 train_time:838266ms step_avg:227.54ms step:3685/7050 train_time:838502ms step_avg:227.54ms step:3686/7050 train_time:838739ms step_avg:227.55ms step:3687/7050 train_time:838975ms step_avg:227.55ms step:3688/7050 train_time:839211ms step_avg:227.55ms step:3689/7050 train_time:839447ms step_avg:227.55ms step:3690/7050 train_time:839681ms step_avg:227.56ms step:3691/7050 train_time:839917ms step_avg:227.56ms step:3692/7050 train_time:840153ms step_avg:227.56ms step:3693/7050 train_time:840390ms step_avg:227.56ms step:3694/7050 train_time:840625ms step_avg:227.57ms step:3695/7050 train_time:840861ms step_avg:227.57ms step:3696/7050 train_time:841098ms step_avg:227.57ms step:3697/7050 train_time:841338ms step_avg:227.57ms step:3698/7050 train_time:841575ms step_avg:227.58ms step:3699/7050 train_time:841810ms step_avg:227.58ms step:3700/7050 train_time:842047ms step_avg:227.58ms step:3701/7050 train_time:842283ms step_avg:227.58ms step:3702/7050 train_time:842520ms step_avg:227.59ms step:3703/7050 train_time:842755ms step_avg:227.59ms 
step:3704/7050 train_time:842991ms step_avg:227.59ms step:3705/7050 train_time:843228ms step_avg:227.59ms step:3706/7050 train_time:843464ms step_avg:227.59ms step:3707/7050 train_time:843701ms step_avg:227.60ms step:3708/7050 train_time:843937ms step_avg:227.60ms step:3709/7050 train_time:844175ms step_avg:227.60ms step:3710/7050 train_time:844411ms step_avg:227.60ms step:3711/7050 train_time:844647ms step_avg:227.61ms step:3712/7050 train_time:844883ms step_avg:227.61ms step:3713/7050 train_time:845120ms step_avg:227.61ms step:3714/7050 train_time:845356ms step_avg:227.61ms step:3715/7050 train_time:845592ms step_avg:227.62ms step:3716/7050 train_time:845830ms step_avg:227.62ms step:3717/7050 train_time:846066ms step_avg:227.62ms step:3718/7050 train_time:846302ms step_avg:227.62ms step:3719/7050 train_time:846540ms step_avg:227.63ms step:3720/7050 train_time:846776ms step_avg:227.63ms step:3721/7050 train_time:847013ms step_avg:227.63ms step:3722/7050 train_time:847250ms step_avg:227.63ms step:3723/7050 train_time:847486ms step_avg:227.64ms step:3724/7050 train_time:847724ms step_avg:227.64ms step:3725/7050 train_time:847960ms step_avg:227.64ms step:3726/7050 train_time:848197ms step_avg:227.64ms step:3727/7050 train_time:848433ms step_avg:227.65ms step:3728/7050 train_time:848669ms step_avg:227.65ms step:3729/7050 train_time:848905ms step_avg:227.65ms step:3730/7050 train_time:849143ms step_avg:227.65ms step:3731/7050 train_time:849379ms step_avg:227.65ms step:3732/7050 train_time:849616ms step_avg:227.66ms step:3733/7050 train_time:849853ms step_avg:227.66ms step:3734/7050 train_time:850092ms step_avg:227.66ms step:3735/7050 train_time:850328ms step_avg:227.66ms step:3736/7050 train_time:850563ms step_avg:227.67ms step:3737/7050 train_time:850798ms step_avg:227.67ms step:3738/7050 train_time:851036ms step_avg:227.67ms step:3739/7050 train_time:851275ms step_avg:227.67ms step:3740/7050 train_time:851511ms step_avg:227.68ms step:3741/7050 train_time:851746ms 
step_avg:227.68ms step:3742/7050 train_time:851980ms step_avg:227.68ms step:3743/7050 train_time:852215ms step_avg:227.68ms step:3744/7050 train_time:852453ms step_avg:227.69ms step:3745/7050 train_time:852688ms step_avg:227.69ms step:3746/7050 train_time:852923ms step_avg:227.69ms step:3747/7050 train_time:853160ms step_avg:227.69ms step:3748/7050 train_time:853397ms step_avg:227.69ms step:3749/7050 train_time:853634ms step_avg:227.70ms step:3750/7050 train_time:853871ms step_avg:227.70ms step:3750/7050 val_loss:3.1257 train_time:854057ms step_avg:227.75ms step:3751/7050 train_time:854109ms step_avg:227.70ms step:3752/7050 train_time:854342ms step_avg:227.70ms step:3753/7050 train_time:854579ms step_avg:227.71ms step:3754/7050 train_time:854818ms step_avg:227.71ms step:3755/7050 train_time:855053ms step_avg:227.71ms step:3756/7050 train_time:855288ms step_avg:227.71ms step:3757/7050 train_time:855527ms step_avg:227.72ms step:3758/7050 train_time:855765ms step_avg:227.72ms step:3759/7050 train_time:856003ms step_avg:227.72ms step:3760/7050 train_time:856239ms step_avg:227.72ms step:3761/7050 train_time:856474ms step_avg:227.72ms step:3762/7050 train_time:856713ms step_avg:227.73ms step:3763/7050 train_time:856949ms step_avg:227.73ms step:3764/7050 train_time:857186ms step_avg:227.73ms step:3765/7050 train_time:857421ms step_avg:227.73ms step:3766/7050 train_time:857658ms step_avg:227.74ms step:3767/7050 train_time:857896ms step_avg:227.74ms step:3768/7050 train_time:858133ms step_avg:227.74ms step:3769/7050 train_time:858370ms step_avg:227.74ms step:3770/7050 train_time:858606ms step_avg:227.75ms step:3771/7050 train_time:858842ms step_avg:227.75ms step:3772/7050 train_time:859079ms step_avg:227.75ms step:3773/7050 train_time:859315ms step_avg:227.75ms step:3774/7050 train_time:859551ms step_avg:227.76ms step:3775/7050 train_time:859789ms step_avg:227.76ms step:3776/7050 train_time:860026ms step_avg:227.76ms step:3777/7050 train_time:860262ms step_avg:227.76ms 
step:3778/7050 train_time:860500ms step_avg:227.77ms step:3779/7050 train_time:860737ms step_avg:227.77ms step:3780/7050 train_time:860974ms step_avg:227.77ms step:3781/7050 train_time:861212ms step_avg:227.77ms step:3782/7050 train_time:861447ms step_avg:227.78ms step:3783/7050 train_time:861684ms step_avg:227.78ms step:3784/7050 train_time:861921ms step_avg:227.78ms step:3785/7050 train_time:862157ms step_avg:227.78ms step:3786/7050 train_time:862394ms step_avg:227.78ms step:3787/7050 train_time:862631ms step_avg:227.79ms step:3788/7050 train_time:862868ms step_avg:227.79ms step:3789/7050 train_time:863105ms step_avg:227.79ms step:3790/7050 train_time:863343ms step_avg:227.79ms step:3791/7050 train_time:863578ms step_avg:227.80ms step:3792/7050 train_time:863816ms step_avg:227.80ms step:3793/7050 train_time:864053ms step_avg:227.80ms step:3794/7050 train_time:864290ms step_avg:227.80ms step:3795/7050 train_time:864527ms step_avg:227.81ms step:3796/7050 train_time:864765ms step_avg:227.81ms step:3797/7050 train_time:865003ms step_avg:227.81ms step:3798/7050 train_time:865240ms step_avg:227.81ms step:3799/7050 train_time:865475ms step_avg:227.82ms step:3800/7050 train_time:865715ms step_avg:227.82ms step:3801/7050 train_time:865951ms step_avg:227.82ms step:3802/7050 train_time:866189ms step_avg:227.82ms step:3803/7050 train_time:866429ms step_avg:227.83ms step:3804/7050 train_time:866665ms step_avg:227.83ms step:3805/7050 train_time:866903ms step_avg:227.83ms step:3806/7050 train_time:867139ms step_avg:227.83ms step:3807/7050 train_time:867375ms step_avg:227.84ms step:3808/7050 train_time:867612ms step_avg:227.84ms step:3809/7050 train_time:867848ms step_avg:227.84ms step:3810/7050 train_time:868086ms step_avg:227.84ms step:3811/7050 train_time:868322ms step_avg:227.85ms step:3812/7050 train_time:868558ms step_avg:227.85ms step:3813/7050 train_time:868793ms step_avg:227.85ms step:3814/7050 train_time:869032ms step_avg:227.85ms step:3815/7050 train_time:869268ms 
step_avg:227.86ms step:3816/7050 train_time:869504ms step_avg:227.86ms step:3817/7050 train_time:869740ms step_avg:227.86ms step:3818/7050 train_time:869977ms step_avg:227.86ms step:3819/7050 train_time:870215ms step_avg:227.86ms step:3820/7050 train_time:870452ms step_avg:227.87ms step:3821/7050 train_time:870687ms step_avg:227.87ms step:3822/7050 train_time:870923ms step_avg:227.87ms step:3823/7050 train_time:871160ms step_avg:227.87ms step:3824/7050 train_time:871397ms step_avg:227.88ms step:3825/7050 train_time:871634ms step_avg:227.88ms step:3826/7050 train_time:871869ms step_avg:227.88ms step:3827/7050 train_time:872108ms step_avg:227.88ms step:3828/7050 train_time:872344ms step_avg:227.89ms step:3829/7050 train_time:872581ms step_avg:227.89ms step:3830/7050 train_time:872818ms step_avg:227.89ms step:3831/7050 train_time:873054ms step_avg:227.89ms step:3832/7050 train_time:873292ms step_avg:227.89ms step:3833/7050 train_time:873528ms step_avg:227.90ms step:3834/7050 train_time:873764ms step_avg:227.90ms step:3835/7050 train_time:874000ms step_avg:227.90ms step:3836/7050 train_time:874237ms step_avg:227.90ms step:3837/7050 train_time:874478ms step_avg:227.91ms step:3838/7050 train_time:874715ms step_avg:227.91ms step:3839/7050 train_time:874951ms step_avg:227.91ms step:3840/7050 train_time:875189ms step_avg:227.91ms step:3841/7050 train_time:875428ms step_avg:227.92ms step:3842/7050 train_time:875666ms step_avg:227.92ms step:3843/7050 train_time:875904ms step_avg:227.92ms step:3844/7050 train_time:876139ms step_avg:227.92ms step:3845/7050 train_time:876374ms step_avg:227.93ms step:3846/7050 train_time:876611ms step_avg:227.93ms step:3847/7050 train_time:876848ms step_avg:227.93ms step:3848/7050 train_time:877086ms step_avg:227.93ms step:3849/7050 train_time:877324ms step_avg:227.94ms step:3850/7050 train_time:877558ms step_avg:227.94ms step:3851/7050 train_time:877794ms step_avg:227.94ms step:3852/7050 train_time:878031ms step_avg:227.94ms step:3853/7050 
train_time:878270ms step_avg:227.94ms step:3854/7050 train_time:878507ms step_avg:227.95ms step:3855/7050 train_time:878743ms step_avg:227.95ms step:3856/7050 train_time:878979ms step_avg:227.95ms step:3857/7050 train_time:879215ms step_avg:227.95ms step:3858/7050 train_time:879450ms step_avg:227.95ms step:3859/7050 train_time:879688ms step_avg:227.96ms step:3860/7050 train_time:879926ms step_avg:227.96ms step:3861/7050 train_time:880161ms step_avg:227.96ms step:3862/7050 train_time:880398ms step_avg:227.96ms step:3863/7050 train_time:880635ms step_avg:227.97ms step:3864/7050 train_time:880875ms step_avg:227.97ms step:3865/7050 train_time:881111ms step_avg:227.97ms step:3866/7050 train_time:881346ms step_avg:227.97ms step:3867/7050 train_time:881581ms step_avg:227.98ms step:3868/7050 train_time:881820ms step_avg:227.98ms step:3869/7050 train_time:882055ms step_avg:227.98ms step:3870/7050 train_time:882290ms step_avg:227.98ms step:3871/7050 train_time:882525ms step_avg:227.98ms step:3872/7050 train_time:882763ms step_avg:227.99ms step:3873/7050 train_time:882999ms step_avg:227.99ms step:3874/7050 train_time:883235ms step_avg:227.99ms step:3875/7050 train_time:883474ms step_avg:227.99ms step:3875/7050 val_loss:3.1203 train_time:883661ms step_avg:228.04ms step:3876/7050 train_time:883712ms step_avg:228.00ms step:3877/7050 train_time:883947ms step_avg:228.00ms step:3878/7050 train_time:884192ms step_avg:228.00ms step:3879/7050 train_time:884429ms step_avg:228.00ms step:3880/7050 train_time:884663ms step_avg:228.01ms step:3881/7050 train_time:884897ms step_avg:228.01ms step:3882/7050 train_time:885135ms step_avg:228.01ms step:3883/7050 train_time:885372ms step_avg:228.01ms step:3884/7050 train_time:885607ms step_avg:228.01ms step:3885/7050 train_time:885844ms step_avg:228.02ms step:3886/7050 train_time:886082ms step_avg:228.02ms step:3887/7050 train_time:886317ms step_avg:228.02ms step:3888/7050 train_time:886554ms step_avg:228.02ms step:3889/7050 train_time:886790ms 
step_avg:228.03ms step:3890/7050 train_time:887025ms step_avg:228.03ms step:3891/7050 train_time:887263ms step_avg:228.03ms step:3892/7050 train_time:887499ms step_avg:228.03ms step:3893/7050 train_time:887734ms step_avg:228.03ms step:3894/7050 train_time:887970ms step_avg:228.04ms step:3895/7050 train_time:888206ms step_avg:228.04ms step:3896/7050 train_time:888442ms step_avg:228.04ms step:3897/7050 train_time:888677ms step_avg:228.04ms step:3898/7050 train_time:888916ms step_avg:228.04ms step:3899/7050 train_time:889151ms step_avg:228.05ms step:3900/7050 train_time:889388ms step_avg:228.05ms step:3901/7050 train_time:889624ms step_avg:228.05ms step:3902/7050 train_time:889861ms step_avg:228.05ms step:3903/7050 train_time:890095ms step_avg:228.05ms step:3904/7050 train_time:890333ms step_avg:228.06ms step:3905/7050 train_time:890571ms step_avg:228.06ms step:3906/7050 train_time:890806ms step_avg:228.06ms step:3907/7050 train_time:891043ms step_avg:228.06ms step:3908/7050 train_time:891280ms step_avg:228.07ms step:3909/7050 train_time:891516ms step_avg:228.07ms step:3910/7050 train_time:891752ms step_avg:228.07ms step:3911/7050 train_time:891989ms step_avg:228.07ms step:3912/7050 train_time:892225ms step_avg:228.07ms step:3913/7050 train_time:892462ms step_avg:228.08ms step:3914/7050 train_time:892697ms step_avg:228.08ms step:3915/7050 train_time:892933ms step_avg:228.08ms step:3916/7050 train_time:893171ms step_avg:228.08ms step:3917/7050 train_time:893408ms step_avg:228.08ms step:3918/7050 train_time:893645ms step_avg:228.09ms step:3919/7050 train_time:893882ms step_avg:228.09ms step:3920/7050 train_time:894118ms step_avg:228.09ms step:3921/7050 train_time:894354ms step_avg:228.09ms step:3922/7050 train_time:894591ms step_avg:228.10ms step:3923/7050 train_time:894827ms step_avg:228.10ms step:3924/7050 train_time:895064ms step_avg:228.10ms step:3925/7050 train_time:895301ms step_avg:228.10ms step:3926/7050 train_time:895539ms step_avg:228.10ms step:3927/7050 
train_time:895774ms step_avg:228.11ms step:3928/7050 train_time:896011ms step_avg:228.11ms step:3929/7050 train_time:896247ms step_avg:228.11ms step:3930/7050 train_time:896485ms step_avg:228.11ms step:3931/7050 train_time:896720ms step_avg:228.11ms step:3932/7050 train_time:896956ms step_avg:228.12ms step:3933/7050 train_time:897193ms step_avg:228.12ms step:3934/7050 train_time:897430ms step_avg:228.12ms step:3935/7050 train_time:897670ms step_avg:228.12ms step:3936/7050 train_time:897906ms step_avg:228.13ms step:3937/7050 train_time:898143ms step_avg:228.13ms step:3938/7050 train_time:898379ms step_avg:228.13ms step:3939/7050 train_time:898615ms step_avg:228.13ms step:3940/7050 train_time:898852ms step_avg:228.13ms step:3941/7050 train_time:899088ms step_avg:228.14ms step:3942/7050 train_time:899325ms step_avg:228.14ms step:3943/7050 train_time:899562ms step_avg:228.14ms step:3944/7050 train_time:899799ms step_avg:228.14ms step:3945/7050 train_time:900034ms step_avg:228.15ms step:3946/7050 train_time:900271ms step_avg:228.15ms step:3947/7050 train_time:900508ms step_avg:228.15ms step:3948/7050 train_time:900747ms step_avg:228.15ms step:3949/7050 train_time:900986ms step_avg:228.16ms step:3950/7050 train_time:901222ms step_avg:228.16ms step:3951/7050 train_time:901457ms step_avg:228.16ms step:3952/7050 train_time:901694ms step_avg:228.16ms step:3953/7050 train_time:901931ms step_avg:228.16ms step:3954/7050 train_time:902168ms step_avg:228.17ms step:3955/7050 train_time:902406ms step_avg:228.17ms step:3956/7050 train_time:902643ms step_avg:228.17ms step:3957/7050 train_time:902880ms step_avg:228.17ms step:3958/7050 train_time:903116ms step_avg:228.17ms step:3959/7050 train_time:903353ms step_avg:228.18ms step:3960/7050 train_time:903591ms step_avg:228.18ms step:3961/7050 train_time:903827ms step_avg:228.18ms step:3962/7050 train_time:904065ms step_avg:228.18ms step:3963/7050 train_time:904301ms step_avg:228.19ms step:3964/7050 train_time:904538ms step_avg:228.19ms 
step:3965/7050 train_time:904775ms step_avg:228.19ms step:3966/7050 train_time:905012ms step_avg:228.19ms step:3967/7050 train_time:905248ms step_avg:228.19ms step:3968/7050 train_time:905487ms step_avg:228.20ms step:3969/7050 train_time:905722ms step_avg:228.20ms step:3970/7050 train_time:905958ms step_avg:228.20ms step:3971/7050 train_time:906193ms step_avg:228.20ms step:3972/7050 train_time:906429ms step_avg:228.20ms step:3973/7050 train_time:906667ms step_avg:228.21ms step:3974/7050 train_time:906905ms step_avg:228.21ms step:3975/7050 train_time:907141ms step_avg:228.21ms step:3976/7050 train_time:907378ms step_avg:228.21ms step:3977/7050 train_time:907612ms step_avg:228.22ms step:3978/7050 train_time:907848ms step_avg:228.22ms step:3979/7050 train_time:908085ms step_avg:228.22ms step:3980/7050 train_time:908321ms step_avg:228.22ms step:3981/7050 train_time:908558ms step_avg:228.22ms step:3982/7050 train_time:908795ms step_avg:228.23ms step:3983/7050 train_time:909030ms step_avg:228.23ms step:3984/7050 train_time:909269ms step_avg:228.23ms step:3985/7050 train_time:909507ms step_avg:228.23ms step:3986/7050 train_time:909745ms step_avg:228.24ms step:3987/7050 train_time:909982ms step_avg:228.24ms step:3988/7050 train_time:910219ms step_avg:228.24ms step:3989/7050 train_time:910454ms step_avg:228.24ms step:3990/7050 train_time:910689ms step_avg:228.24ms step:3991/7050 train_time:910926ms step_avg:228.25ms step:3992/7050 train_time:911162ms step_avg:228.25ms step:3993/7050 train_time:911398ms step_avg:228.25ms step:3994/7050 train_time:911633ms step_avg:228.25ms step:3995/7050 train_time:911872ms step_avg:228.25ms step:3996/7050 train_time:912110ms step_avg:228.26ms step:3997/7050 train_time:912346ms step_avg:228.26ms step:3998/7050 train_time:912583ms step_avg:228.26ms step:3999/7050 train_time:912820ms step_avg:228.26ms step:4000/7050 train_time:913055ms step_avg:228.26ms step:4000/7050 val_loss:3.1134 train_time:913245ms step_avg:228.31ms step:4001/7050 
train_time:913296ms step_avg:228.27ms step:4002/7050 train_time:913533ms step_avg:228.27ms step:4003/7050 train_time:913771ms step_avg:228.27ms step:4004/7050 train_time:914008ms step_avg:228.27ms step:4005/7050 train_time:914245ms step_avg:228.28ms step:4006/7050 train_time:914482ms step_avg:228.28ms step:4007/7050 train_time:914717ms step_avg:228.28ms step:4008/7050 train_time:914955ms step_avg:228.28ms step:4009/7050 train_time:915191ms step_avg:228.28ms step:4010/7050 train_time:915428ms step_avg:228.29ms step:4011/7050 train_time:915663ms step_avg:228.29ms step:4012/7050 train_time:915899ms step_avg:228.29ms step:4013/7050 train_time:916135ms step_avg:228.29ms step:4014/7050 train_time:916372ms step_avg:228.29ms step:4015/7050 train_time:916609ms step_avg:228.30ms step:4016/7050 train_time:916845ms step_avg:228.30ms step:4017/7050 train_time:917081ms step_avg:228.30ms step:4018/7050 train_time:917317ms step_avg:228.30ms step:4019/7050 train_time:917555ms step_avg:228.30ms step:4020/7050 train_time:917791ms step_avg:228.31ms step:4021/7050 train_time:918028ms step_avg:228.31ms step:4022/7050 train_time:918264ms step_avg:228.31ms step:4023/7050 train_time:918501ms step_avg:228.31ms step:4024/7050 train_time:918737ms step_avg:228.31ms step:4025/7050 train_time:918973ms step_avg:228.32ms step:4026/7050 train_time:919209ms step_avg:228.32ms step:4027/7050 train_time:919445ms step_avg:228.32ms step:4028/7050 train_time:919683ms step_avg:228.32ms step:4029/7050 train_time:919918ms step_avg:228.32ms step:4030/7050 train_time:920153ms step_avg:228.33ms step:4031/7050 train_time:920390ms step_avg:228.33ms step:4032/7050 train_time:920627ms step_avg:228.33ms step:4033/7050 train_time:920863ms step_avg:228.33ms step:4034/7050 train_time:921098ms step_avg:228.33ms step:4035/7050 train_time:921336ms step_avg:228.34ms step:4036/7050 train_time:921572ms step_avg:228.34ms step:4037/7050 train_time:921808ms step_avg:228.34ms step:4038/7050 train_time:922045ms step_avg:228.34ms 
step:4039/7050 train_time:922280ms step_avg:228.34ms step:4040/7050 train_time:922515ms step_avg:228.35ms step:4041/7050 train_time:922751ms step_avg:228.35ms step:4042/7050 train_time:922988ms step_avg:228.35ms step:4043/7050 train_time:923224ms step_avg:228.35ms step:4044/7050 train_time:923461ms step_avg:228.35ms step:4045/7050 train_time:923696ms step_avg:228.35ms step:4046/7050 train_time:923933ms step_avg:228.36ms step:4047/7050 train_time:924171ms step_avg:228.36ms step:4048/7050 train_time:924406ms step_avg:228.36ms step:4049/7050 train_time:924643ms step_avg:228.36ms step:4050/7050 train_time:924879ms step_avg:228.37ms step:4051/7050 train_time:925117ms step_avg:228.37ms step:4052/7050 train_time:925355ms step_avg:228.37ms step:4053/7050 train_time:925591ms step_avg:228.37ms step:4054/7050 train_time:925827ms step_avg:228.37ms step:4055/7050 train_time:926063ms step_avg:228.38ms step:4056/7050 train_time:926300ms step_avg:228.38ms step:4057/7050 train_time:926538ms step_avg:228.38ms step:4058/7050 train_time:926774ms step_avg:228.38ms step:4059/7050 train_time:927010ms step_avg:228.38ms step:4060/7050 train_time:927249ms step_avg:228.39ms step:4061/7050 train_time:927485ms step_avg:228.39ms step:4062/7050 train_time:927723ms step_avg:228.39ms step:4063/7050 train_time:927958ms step_avg:228.39ms step:4064/7050 train_time:928194ms step_avg:228.39ms step:4065/7050 train_time:928432ms step_avg:228.40ms step:4066/7050 train_time:928668ms step_avg:228.40ms step:4067/7050 train_time:928904ms step_avg:228.40ms step:4068/7050 train_time:929141ms step_avg:228.40ms step:4069/7050 train_time:929377ms step_avg:228.40ms step:4070/7050 train_time:929614ms step_avg:228.41ms step:4071/7050 train_time:929851ms step_avg:228.41ms step:4072/7050 train_time:930086ms step_avg:228.41ms step:4073/7050 train_time:930324ms step_avg:228.41ms step:4074/7050 train_time:930558ms step_avg:228.41ms step:4075/7050 train_time:930794ms step_avg:228.42ms step:4076/7050 train_time:931030ms 
step_avg:228.42ms step:4077/7050 train_time:931267ms step_avg:228.42ms step:4078/7050 train_time:931503ms step_avg:228.42ms step:4079/7050 train_time:931740ms step_avg:228.42ms step:4080/7050 train_time:931977ms step_avg:228.43ms step:4081/7050 train_time:932213ms step_avg:228.43ms step:4082/7050 train_time:932449ms step_avg:228.43ms step:4083/7050 train_time:932683ms step_avg:228.43ms step:4084/7050 train_time:932918ms step_avg:228.43ms step:4085/7050 train_time:933154ms step_avg:228.43ms step:4086/7050 train_time:933391ms step_avg:228.44ms step:4087/7050 train_time:933628ms step_avg:228.44ms step:4088/7050 train_time:933865ms step_avg:228.44ms step:4089/7050 train_time:934102ms step_avg:228.44ms step:4090/7050 train_time:934338ms step_avg:228.44ms step:4091/7050 train_time:934575ms step_avg:228.45ms step:4092/7050 train_time:934812ms step_avg:228.45ms step:4093/7050 train_time:935049ms step_avg:228.45ms step:4094/7050 train_time:935285ms step_avg:228.45ms step:4095/7050 train_time:935521ms step_avg:228.45ms step:4096/7050 train_time:935758ms step_avg:228.46ms step:4097/7050 train_time:935995ms step_avg:228.46ms step:4098/7050 train_time:936235ms step_avg:228.46ms step:4099/7050 train_time:936472ms step_avg:228.46ms step:4100/7050 train_time:936707ms step_avg:228.47ms step:4101/7050 train_time:936943ms step_avg:228.47ms step:4102/7050 train_time:937180ms step_avg:228.47ms step:4103/7050 train_time:937416ms step_avg:228.47ms step:4104/7050 train_time:937654ms step_avg:228.47ms step:4105/7050 train_time:937893ms step_avg:228.48ms step:4106/7050 train_time:938131ms step_avg:228.48ms step:4107/7050 train_time:938366ms step_avg:228.48ms step:4108/7050 train_time:938602ms step_avg:228.48ms step:4109/7050 train_time:938839ms step_avg:228.48ms step:4110/7050 train_time:939076ms step_avg:228.49ms step:4111/7050 train_time:939312ms step_avg:228.49ms step:4112/7050 train_time:939549ms step_avg:228.49ms step:4113/7050 train_time:939784ms step_avg:228.49ms step:4114/7050 
train_time:940021ms step_avg:228.49ms step:4115/7050 train_time:940258ms step_avg:228.50ms step:4116/7050 train_time:940493ms step_avg:228.50ms step:4117/7050 train_time:940730ms step_avg:228.50ms step:4118/7050 train_time:940965ms step_avg:228.50ms step:4119/7050 train_time:941203ms step_avg:228.50ms step:4120/7050 train_time:941440ms step_avg:228.50ms step:4121/7050 train_time:941676ms step_avg:228.51ms step:4122/7050 train_time:941912ms step_avg:228.51ms step:4123/7050 train_time:942149ms step_avg:228.51ms step:4124/7050 train_time:942384ms step_avg:228.51ms step:4125/7050 train_time:942621ms step_avg:228.51ms step:4125/7050 val_loss:3.1105 train_time:942808ms step_avg:228.56ms step:4126/7050 train_time:942861ms step_avg:228.52ms step:4127/7050 train_time:943096ms step_avg:228.52ms step:4128/7050 train_time:943334ms step_avg:228.52ms step:4129/7050 train_time:943571ms step_avg:228.52ms step:4130/7050 train_time:943807ms step_avg:228.52ms step:4131/7050 train_time:944045ms step_avg:228.53ms step:4132/7050 train_time:944284ms step_avg:228.53ms step:4133/7050 train_time:944520ms step_avg:228.53ms step:4134/7050 train_time:944756ms step_avg:228.53ms step:4135/7050 train_time:944992ms step_avg:228.53ms step:4136/7050 train_time:945231ms step_avg:228.54ms step:4137/7050 train_time:945467ms step_avg:228.54ms step:4138/7050 train_time:945703ms step_avg:228.54ms step:4139/7050 train_time:945939ms step_avg:228.54ms step:4140/7050 train_time:946176ms step_avg:228.54ms step:4141/7050 train_time:946414ms step_avg:228.55ms step:4142/7050 train_time:946650ms step_avg:228.55ms step:4143/7050 train_time:946887ms step_avg:228.55ms step:4144/7050 train_time:947122ms step_avg:228.55ms step:4145/7050 train_time:947358ms step_avg:228.55ms step:4146/7050 train_time:947595ms step_avg:228.56ms step:4147/7050 train_time:947833ms step_avg:228.56ms step:4148/7050 train_time:948070ms step_avg:228.56ms step:4149/7050 train_time:948305ms step_avg:228.56ms step:4150/7050 train_time:948541ms 
step_avg:228.56ms step:4151/7050 train_time:948778ms step_avg:228.57ms step:4152/7050 train_time:949015ms step_avg:228.57ms step:4153/7050 train_time:949251ms step_avg:228.57ms step:4154/7050 train_time:949486ms step_avg:228.57ms step:4155/7050 train_time:949723ms step_avg:228.57ms step:4156/7050 train_time:949962ms step_avg:228.58ms step:4157/7050 train_time:950198ms step_avg:228.58ms step:4158/7050 train_time:950438ms step_avg:228.58ms step:4159/7050 train_time:950677ms step_avg:228.58ms step:4160/7050 train_time:950914ms step_avg:228.59ms step:4161/7050 train_time:951150ms step_avg:228.59ms step:4162/7050 train_time:951388ms step_avg:228.59ms step:4163/7050 train_time:951627ms step_avg:228.59ms step:4164/7050 train_time:951863ms step_avg:228.59ms step:4165/7050 train_time:952097ms step_avg:228.59ms step:4166/7050 train_time:952333ms step_avg:228.60ms step:4167/7050 train_time:952568ms step_avg:228.60ms step:4168/7050 train_time:952803ms step_avg:228.60ms step:4169/7050 train_time:953039ms step_avg:228.60ms step:4170/7050 train_time:953274ms step_avg:228.60ms step:4171/7050 train_time:953512ms step_avg:228.61ms step:4172/7050 train_time:953748ms step_avg:228.61ms step:4173/7050 train_time:953983ms step_avg:228.61ms step:4174/7050 train_time:954220ms step_avg:228.61ms step:4175/7050 train_time:954454ms step_avg:228.61ms step:4176/7050 train_time:954691ms step_avg:228.61ms step:4177/7050 train_time:954927ms step_avg:228.62ms step:4178/7050 train_time:955162ms step_avg:228.62ms step:4179/7050 train_time:955399ms step_avg:228.62ms step:4180/7050 train_time:955636ms step_avg:228.62ms step:4181/7050 train_time:955873ms step_avg:228.62ms step:4182/7050 train_time:956109ms step_avg:228.62ms step:4183/7050 train_time:956346ms step_avg:228.63ms step:4184/7050 train_time:956582ms step_avg:228.63ms step:4185/7050 train_time:956820ms step_avg:228.63ms step:4186/7050 train_time:957057ms step_avg:228.63ms step:4187/7050 train_time:957295ms step_avg:228.64ms step:4188/7050 
train_time:957532ms step_avg:228.64ms step:4189/7050 train_time:957768ms step_avg:228.64ms step:4190/7050 train_time:958006ms step_avg:228.64ms step:4191/7050 train_time:958248ms step_avg:228.64ms step:4192/7050 train_time:958484ms step_avg:228.65ms step:4193/7050 train_time:958721ms step_avg:228.65ms step:4194/7050 train_time:958959ms step_avg:228.65ms step:4195/7050 train_time:959195ms step_avg:228.65ms step:4196/7050 train_time:959432ms step_avg:228.65ms step:4197/7050 train_time:959668ms step_avg:228.66ms step:4198/7050 train_time:959905ms step_avg:228.66ms step:4199/7050 train_time:960144ms step_avg:228.66ms step:4200/7050 train_time:960382ms step_avg:228.66ms step:4201/7050 train_time:960618ms step_avg:228.66ms step:4202/7050 train_time:960854ms step_avg:228.67ms step:4203/7050 train_time:961090ms step_avg:228.67ms step:4204/7050 train_time:961326ms step_avg:228.67ms step:4205/7050 train_time:961564ms step_avg:228.67ms step:4206/7050 train_time:961803ms step_avg:228.67ms step:4207/7050 train_time:962040ms step_avg:228.68ms step:4208/7050 train_time:962276ms step_avg:228.68ms step:4209/7050 train_time:962513ms step_avg:228.68ms step:4210/7050 train_time:962749ms step_avg:228.68ms step:4211/7050 train_time:962984ms step_avg:228.68ms step:4212/7050 train_time:963223ms step_avg:228.69ms step:4213/7050 train_time:963460ms step_avg:228.69ms step:4214/7050 train_time:963696ms step_avg:228.69ms step:4215/7050 train_time:963934ms step_avg:228.69ms step:4216/7050 train_time:964170ms step_avg:228.69ms step:4217/7050 train_time:964407ms step_avg:228.69ms step:4218/7050 train_time:964643ms step_avg:228.70ms step:4219/7050 train_time:964879ms step_avg:228.70ms step:4220/7050 train_time:965116ms step_avg:228.70ms step:4221/7050 train_time:965352ms step_avg:228.70ms step:4222/7050 train_time:965587ms step_avg:228.70ms step:4223/7050 train_time:965826ms step_avg:228.71ms step:4224/7050 train_time:966062ms step_avg:228.71ms step:4225/7050 train_time:966298ms step_avg:228.71ms 
step:4226/7050 train_time:966534ms step_avg:228.71ms step:4227/7050 train_time:966769ms step_avg:228.71ms step:4228/7050 train_time:967006ms step_avg:228.71ms step:4229/7050 train_time:967243ms step_avg:228.72ms step:4230/7050 train_time:967479ms step_avg:228.72ms step:4231/7050 train_time:967717ms step_avg:228.72ms step:4232/7050 train_time:967952ms step_avg:228.72ms step:4233/7050 train_time:968189ms step_avg:228.72ms step:4234/7050 train_time:968426ms step_avg:228.73ms step:4235/7050 train_time:968664ms step_avg:228.73ms step:4236/7050 train_time:968902ms step_avg:228.73ms step:4237/7050 train_time:969138ms step_avg:228.73ms step:4238/7050 train_time:969375ms step_avg:228.73ms step:4239/7050 train_time:969612ms step_avg:228.74ms step:4240/7050 train_time:969850ms step_avg:228.74ms step:4241/7050 train_time:970087ms step_avg:228.74ms step:4242/7050 train_time:970325ms step_avg:228.74ms step:4243/7050 train_time:970563ms step_avg:228.74ms step:4244/7050 train_time:970800ms step_avg:228.75ms step:4245/7050 train_time:971038ms step_avg:228.75ms step:4246/7050 train_time:971275ms step_avg:228.75ms step:4247/7050 train_time:971514ms step_avg:228.75ms step:4248/7050 train_time:971750ms step_avg:228.75ms step:4249/7050 train_time:971988ms step_avg:228.76ms step:4250/7050 train_time:972227ms step_avg:228.76ms step:4250/7050 val_loss:3.1043 train_time:972414ms step_avg:228.80ms step:4251/7050 train_time:972465ms step_avg:228.76ms step:4252/7050 train_time:972703ms step_avg:228.76ms step:4253/7050 train_time:972939ms step_avg:228.77ms step:4254/7050 train_time:973176ms step_avg:228.77ms step:4255/7050 train_time:973415ms step_avg:228.77ms step:4256/7050 train_time:973652ms step_avg:228.77ms step:4257/7050 train_time:973889ms step_avg:228.77ms step:4258/7050 train_time:974124ms step_avg:228.78ms step:4259/7050 train_time:974362ms step_avg:228.78ms step:4260/7050 train_time:974599ms step_avg:228.78ms step:4261/7050 train_time:974832ms step_avg:228.78ms step:4262/7050 
train_time:975069ms step_avg:228.78ms step:4263/7050 train_time:975306ms step_avg:228.78ms step:4264/7050 train_time:975543ms step_avg:228.79ms step:4265/7050 train_time:975782ms step_avg:228.79ms step:4266/7050 train_time:976019ms step_avg:228.79ms step:4267/7050 train_time:976256ms step_avg:228.79ms step:4268/7050 train_time:976492ms step_avg:228.79ms step:4269/7050 train_time:976730ms step_avg:228.80ms step:4270/7050 train_time:976968ms step_avg:228.80ms step:4271/7050 train_time:977206ms step_avg:228.80ms step:4272/7050 train_time:977445ms step_avg:228.80ms step:4273/7050 train_time:977682ms step_avg:228.80ms step:4274/7050 train_time:977919ms step_avg:228.81ms step:4275/7050 train_time:978156ms step_avg:228.81ms step:4276/7050 train_time:978393ms step_avg:228.81ms step:4277/7050 train_time:978629ms step_avg:228.81ms step:4278/7050 train_time:978867ms step_avg:228.81ms step:4279/7050 train_time:979103ms step_avg:228.82ms step:4280/7050 train_time:979339ms step_avg:228.82ms step:4281/7050 train_time:979576ms step_avg:228.82ms step:4282/7050 train_time:979811ms step_avg:228.82ms step:4283/7050 train_time:980049ms step_avg:228.82ms step:4284/7050 train_time:980286ms step_avg:228.82ms step:4285/7050 train_time:980523ms step_avg:228.83ms step:4286/7050 train_time:980759ms step_avg:228.83ms step:4287/7050 train_time:980995ms step_avg:228.83ms step:4288/7050 train_time:981234ms step_avg:228.83ms step:4289/7050 train_time:981470ms step_avg:228.83ms step:4290/7050 train_time:981708ms step_avg:228.84ms step:4291/7050 train_time:981944ms step_avg:228.84ms step:4292/7050 train_time:982182ms step_avg:228.84ms step:4293/7050 train_time:982419ms step_avg:228.84ms step:4294/7050 train_time:982658ms step_avg:228.84ms step:4295/7050 train_time:982894ms step_avg:228.85ms step:4296/7050 train_time:983130ms step_avg:228.85ms step:4297/7050 train_time:983367ms step_avg:228.85ms step:4298/7050 train_time:983605ms step_avg:228.85ms step:4299/7050 train_time:983842ms step_avg:228.85ms 
step:4300/7050 train_time:984079ms step_avg:228.86ms step:4301/7050 train_time:984315ms step_avg:228.86ms step:4302/7050 train_time:984552ms step_avg:228.86ms step:4303/7050 train_time:984790ms step_avg:228.86ms step:4304/7050 train_time:985028ms step_avg:228.86ms step:4305/7050 train_time:985265ms step_avg:228.87ms step:4306/7050 train_time:985502ms step_avg:228.87ms step:4307/7050 train_time:985739ms step_avg:228.87ms step:4308/7050 train_time:985976ms step_avg:228.87ms step:4309/7050 train_time:986212ms step_avg:228.87ms step:4310/7050 train_time:986449ms step_avg:228.87ms step:4311/7050 train_time:986689ms step_avg:228.88ms step:4312/7050 train_time:986926ms step_avg:228.88ms step:4313/7050 train_time:987163ms step_avg:228.88ms step:4314/7050 train_time:987399ms step_avg:228.88ms step:4315/7050 train_time:987636ms step_avg:228.88ms step:4316/7050 train_time:987873ms step_avg:228.89ms step:4317/7050 train_time:988109ms step_avg:228.89ms step:4318/7050 train_time:988349ms step_avg:228.89ms step:4319/7050 train_time:988586ms step_avg:228.89ms step:4320/7050 train_time:988824ms step_avg:228.89ms step:4321/7050 train_time:989062ms step_avg:228.90ms step:4322/7050 train_time:989297ms step_avg:228.90ms step:4323/7050 train_time:989534ms step_avg:228.90ms step:4324/7050 train_time:989772ms step_avg:228.90ms step:4325/7050 train_time:990012ms step_avg:228.90ms step:4326/7050 train_time:990249ms step_avg:228.91ms step:4327/7050 train_time:990486ms step_avg:228.91ms step:4328/7050 train_time:990722ms step_avg:228.91ms step:4329/7050 train_time:990959ms step_avg:228.91ms step:4330/7050 train_time:991195ms step_avg:228.91ms step:4331/7050 train_time:991432ms step_avg:228.92ms step:4332/7050 train_time:991670ms step_avg:228.92ms step:4333/7050 train_time:991907ms step_avg:228.92ms step:4334/7050 train_time:992142ms step_avg:228.92ms step:4335/7050 train_time:992380ms step_avg:228.92ms step:4336/7050 train_time:992616ms step_avg:228.92ms step:4337/7050 train_time:992857ms 
step_avg:228.93ms step:4338/7050 train_time:993093ms step_avg:228.93ms step:4339/7050 train_time:993328ms step_avg:228.93ms step:4340/7050 train_time:993565ms step_avg:228.93ms step:4341/7050 train_time:993802ms step_avg:228.93ms step:4342/7050 train_time:994040ms step_avg:228.94ms step:4343/7050 train_time:994275ms step_avg:228.94ms step:4344/7050 train_time:994511ms step_avg:228.94ms step:4345/7050 train_time:994749ms step_avg:228.94ms step:4346/7050 train_time:994986ms step_avg:228.94ms step:4347/7050 train_time:995223ms step_avg:228.94ms step:4348/7050 train_time:995462ms step_avg:228.95ms step:4349/7050 train_time:995699ms step_avg:228.95ms step:4350/7050 train_time:995937ms step_avg:228.95ms step:4351/7050 train_time:996176ms step_avg:228.95ms step:4352/7050 train_time:996411ms step_avg:228.95ms step:4353/7050 train_time:996649ms step_avg:228.96ms step:4354/7050 train_time:996885ms step_avg:228.96ms step:4355/7050 train_time:997122ms step_avg:228.96ms step:4356/7050 train_time:997361ms step_avg:228.96ms step:4357/7050 train_time:997597ms step_avg:228.96ms step:4358/7050 train_time:997834ms step_avg:228.97ms step:4359/7050 train_time:998072ms step_avg:228.97ms step:4360/7050 train_time:998309ms step_avg:228.97ms step:4361/7050 train_time:998548ms step_avg:228.97ms step:4362/7050 train_time:998784ms step_avg:228.97ms step:4363/7050 train_time:999020ms step_avg:228.98ms step:4364/7050 train_time:999257ms step_avg:228.98ms step:4365/7050 train_time:999494ms step_avg:228.98ms step:4366/7050 train_time:999732ms step_avg:228.98ms step:4367/7050 train_time:999970ms step_avg:228.98ms step:4368/7050 train_time:1000209ms step_avg:228.99ms step:4369/7050 train_time:1000447ms step_avg:228.99ms step:4370/7050 train_time:1000684ms step_avg:228.99ms step:4371/7050 train_time:1000920ms step_avg:228.99ms step:4372/7050 train_time:1001156ms step_avg:228.99ms step:4373/7050 train_time:1001394ms step_avg:228.99ms step:4374/7050 train_time:1001632ms step_avg:229.00ms 
step:4375/7050 train_time:1001867ms step_avg:229.00ms step:4375/7050 val_loss:3.0957 train_time:1002055ms step_avg:229.04ms step:4376/7050 train_time:1002105ms step_avg:229.00ms step:4377/7050 train_time:1002343ms step_avg:229.00ms step:4378/7050 train_time:1002586ms step_avg:229.01ms step:4379/7050 train_time:1002822ms step_avg:229.01ms step:4380/7050 train_time:1003058ms step_avg:229.01ms step:4381/7050 train_time:1003295ms step_avg:229.01ms step:4382/7050 train_time:1003534ms step_avg:229.01ms step:4383/7050 train_time:1003772ms step_avg:229.01ms step:4384/7050 train_time:1004007ms step_avg:229.02ms step:4385/7050 train_time:1004244ms step_avg:229.02ms step:4386/7050 train_time:1004484ms step_avg:229.02ms step:4387/7050 train_time:1004721ms step_avg:229.02ms step:4388/7050 train_time:1004958ms step_avg:229.02ms step:4389/7050 train_time:1005194ms step_avg:229.03ms step:4390/7050 train_time:1005430ms step_avg:229.03ms step:4391/7050 train_time:1005669ms step_avg:229.03ms step:4392/7050 train_time:1005905ms step_avg:229.03ms step:4393/7050 train_time:1006140ms step_avg:229.03ms step:4394/7050 train_time:1006378ms step_avg:229.03ms step:4395/7050 train_time:1006616ms step_avg:229.04ms step:4396/7050 train_time:1006855ms step_avg:229.04ms step:4397/7050 train_time:1007090ms step_avg:229.04ms step:4398/7050 train_time:1007328ms step_avg:229.04ms step:4399/7050 train_time:1007565ms step_avg:229.04ms step:4400/7050 train_time:1007804ms step_avg:229.05ms step:4401/7050 train_time:1008040ms step_avg:229.05ms step:4402/7050 train_time:1008280ms step_avg:229.05ms step:4403/7050 train_time:1008515ms step_avg:229.05ms step:4404/7050 train_time:1008752ms step_avg:229.05ms step:4405/7050 train_time:1008988ms step_avg:229.06ms step:4406/7050 train_time:1009226ms step_avg:229.06ms step:4407/7050 train_time:1009462ms step_avg:229.06ms step:4408/7050 train_time:1009701ms step_avg:229.06ms step:4409/7050 train_time:1009938ms step_avg:229.06ms step:4410/7050 train_time:1010175ms 
step_avg:229.06ms step:4411/7050 train_time:1010413ms step_avg:229.07ms step:4412/7050 train_time:1010651ms step_avg:229.07ms step:4413/7050 train_time:1010885ms step_avg:229.07ms step:4414/7050 train_time:1011121ms step_avg:229.07ms step:4415/7050 train_time:1011361ms step_avg:229.07ms step:4416/7050 train_time:1011598ms step_avg:229.08ms step:4417/7050 train_time:1011834ms step_avg:229.08ms step:4418/7050 train_time:1012070ms step_avg:229.08ms step:4419/7050 train_time:1012305ms step_avg:229.08ms step:4420/7050 train_time:1012545ms step_avg:229.08ms step:4421/7050 train_time:1012781ms step_avg:229.08ms step:4422/7050 train_time:1013018ms step_avg:229.09ms step:4423/7050 train_time:1013256ms step_avg:229.09ms step:4424/7050 train_time:1013493ms step_avg:229.09ms step:4425/7050 train_time:1013731ms step_avg:229.09ms step:4426/7050 train_time:1013966ms step_avg:229.09ms step:4427/7050 train_time:1014204ms step_avg:229.10ms step:4428/7050 train_time:1014442ms step_avg:229.10ms step:4429/7050 train_time:1014678ms step_avg:229.10ms step:4430/7050 train_time:1014915ms step_avg:229.10ms step:4431/7050 train_time:1015154ms step_avg:229.10ms step:4432/7050 train_time:1015391ms step_avg:229.10ms step:4433/7050 train_time:1015626ms step_avg:229.11ms step:4434/7050 train_time:1015864ms step_avg:229.11ms step:4435/7050 train_time:1016103ms step_avg:229.11ms step:4436/7050 train_time:1016340ms step_avg:229.11ms step:4437/7050 train_time:1016578ms step_avg:229.11ms step:4438/7050 train_time:1016818ms step_avg:229.12ms step:4439/7050 train_time:1017056ms step_avg:229.12ms step:4440/7050 train_time:1017293ms step_avg:229.12ms step:4441/7050 train_time:1017530ms step_avg:229.12ms step:4442/7050 train_time:1017766ms step_avg:229.12ms step:4443/7050 train_time:1018002ms step_avg:229.12ms step:4444/7050 train_time:1018242ms step_avg:229.13ms step:4445/7050 train_time:1018478ms step_avg:229.13ms step:4446/7050 train_time:1018716ms step_avg:229.13ms step:4447/7050 train_time:1018953ms 
step_avg:229.13ms step:4448/7050 train_time:1019189ms step_avg:229.13ms step:4449/7050 train_time:1019426ms step_avg:229.14ms step:4450/7050 train_time:1019664ms step_avg:229.14ms step:4451/7050 train_time:1019901ms step_avg:229.14ms step:4452/7050 train_time:1020139ms step_avg:229.14ms step:4453/7050 train_time:1020378ms step_avg:229.14ms step:4454/7050 train_time:1020614ms step_avg:229.15ms step:4455/7050 train_time:1020850ms step_avg:229.15ms step:4456/7050 train_time:1021088ms step_avg:229.15ms step:4457/7050 train_time:1021324ms step_avg:229.15ms step:4458/7050 train_time:1021565ms step_avg:229.15ms step:4459/7050 train_time:1021799ms step_avg:229.15ms step:4460/7050 train_time:1022038ms step_avg:229.16ms step:4461/7050 train_time:1022278ms step_avg:229.16ms step:4462/7050 train_time:1022518ms step_avg:229.16ms step:4463/7050 train_time:1022756ms step_avg:229.16ms step:4464/7050 train_time:1022991ms step_avg:229.16ms step:4465/7050 train_time:1023227ms step_avg:229.17ms step:4466/7050 train_time:1023464ms step_avg:229.17ms step:4467/7050 train_time:1023700ms step_avg:229.17ms step:4468/7050 train_time:1023938ms step_avg:229.17ms step:4469/7050 train_time:1024174ms step_avg:229.17ms step:4470/7050 train_time:1024411ms step_avg:229.17ms step:4471/7050 train_time:1024647ms step_avg:229.18ms step:4472/7050 train_time:1024887ms step_avg:229.18ms step:4473/7050 train_time:1025123ms step_avg:229.18ms step:4474/7050 train_time:1025360ms step_avg:229.18ms step:4475/7050 train_time:1025596ms step_avg:229.18ms step:4476/7050 train_time:1025834ms step_avg:229.19ms step:4477/7050 train_time:1026070ms step_avg:229.19ms step:4478/7050 train_time:1026304ms step_avg:229.19ms step:4479/7050 train_time:1026543ms step_avg:229.19ms step:4480/7050 train_time:1026782ms step_avg:229.19ms step:4481/7050 train_time:1027021ms step_avg:229.19ms step:4482/7050 train_time:1027258ms step_avg:229.20ms step:4483/7050 train_time:1027494ms step_avg:229.20ms step:4484/7050 train_time:1027732ms 
step_avg:229.20ms step:4485/7050 train_time:1027970ms step_avg:229.20ms step:4486/7050 train_time:1028206ms step_avg:229.20ms step:4487/7050 train_time:1028443ms step_avg:229.20ms step:4488/7050 train_time:1028681ms step_avg:229.21ms step:4489/7050 train_time:1028918ms step_avg:229.21ms step:4490/7050 train_time:1029155ms step_avg:229.21ms step:4491/7050 train_time:1029391ms step_avg:229.21ms step:4492/7050 train_time:1029628ms step_avg:229.21ms step:4493/7050 train_time:1029864ms step_avg:229.22ms step:4494/7050 train_time:1030103ms step_avg:229.22ms step:4495/7050 train_time:1030341ms step_avg:229.22ms step:4496/7050 train_time:1030577ms step_avg:229.22ms step:4497/7050 train_time:1030812ms step_avg:229.22ms step:4498/7050 train_time:1031049ms step_avg:229.22ms step:4499/7050 train_time:1031286ms step_avg:229.23ms step:4500/7050 train_time:1031525ms step_avg:229.23ms step:4500/7050 val_loss:3.0869 train_time:1031716ms step_avg:229.27ms step:4501/7050 train_time:1031767ms step_avg:229.23ms step:4502/7050 train_time:1032005ms step_avg:229.23ms step:4503/7050 train_time:1032244ms step_avg:229.23ms step:4504/7050 train_time:1032481ms step_avg:229.24ms step:4505/7050 train_time:1032718ms step_avg:229.24ms step:4506/7050 train_time:1032955ms step_avg:229.24ms step:4507/7050 train_time:1033191ms step_avg:229.24ms step:4508/7050 train_time:1033431ms step_avg:229.24ms step:4509/7050 train_time:1033666ms step_avg:229.25ms step:4510/7050 train_time:1033903ms step_avg:229.25ms step:4511/7050 train_time:1034141ms step_avg:229.25ms step:4512/7050 train_time:1034377ms step_avg:229.25ms step:4513/7050 train_time:1034614ms step_avg:229.25ms step:4514/7050 train_time:1034850ms step_avg:229.25ms step:4515/7050 train_time:1035086ms step_avg:229.25ms step:4516/7050 train_time:1035321ms step_avg:229.26ms step:4517/7050 train_time:1035559ms step_avg:229.26ms step:4518/7050 train_time:1035795ms step_avg:229.26ms step:4519/7050 train_time:1036032ms step_avg:229.26ms step:4520/7050 
train_time:1036271ms step_avg:229.26ms step:4521/7050 train_time:1036508ms step_avg:229.27ms step:4522/7050 train_time:1036746ms step_avg:229.27ms step:4523/7050 train_time:1036984ms step_avg:229.27ms step:4524/7050 train_time:1037220ms step_avg:229.27ms step:4525/7050 train_time:1037457ms step_avg:229.27ms step:4526/7050 train_time:1037691ms step_avg:229.27ms step:4527/7050 train_time:1037928ms step_avg:229.28ms step:4528/7050 train_time:1038166ms step_avg:229.28ms step:4529/7050 train_time:1038405ms step_avg:229.28ms step:4530/7050 train_time:1038641ms step_avg:229.28ms step:4531/7050 train_time:1038877ms step_avg:229.28ms step:4532/7050 train_time:1039115ms step_avg:229.28ms step:4533/7050 train_time:1039353ms step_avg:229.29ms step:4534/7050 train_time:1039589ms step_avg:229.29ms step:4535/7050 train_time:1039826ms step_avg:229.29ms step:4536/7050 train_time:1040065ms step_avg:229.29ms step:4537/7050 train_time:1040301ms step_avg:229.29ms step:4538/7050 train_time:1040538ms step_avg:229.29ms step:4539/7050 train_time:1040774ms step_avg:229.30ms step:4540/7050 train_time:1041012ms step_avg:229.30ms step:4541/7050 train_time:1041251ms step_avg:229.30ms step:4542/7050 train_time:1041486ms step_avg:229.30ms step:4543/7050 train_time:1041724ms step_avg:229.30ms step:4544/7050 train_time:1041959ms step_avg:229.30ms step:4545/7050 train_time:1042197ms step_avg:229.31ms step:4546/7050 train_time:1042434ms step_avg:229.31ms step:4547/7050 train_time:1042671ms step_avg:229.31ms step:4548/7050 train_time:1042908ms step_avg:229.31ms step:4549/7050 train_time:1043144ms step_avg:229.31ms step:4550/7050 train_time:1043382ms step_avg:229.31ms step:4551/7050 train_time:1043620ms step_avg:229.32ms step:4552/7050 train_time:1043855ms step_avg:229.32ms step:4553/7050 train_time:1044093ms step_avg:229.32ms step:4554/7050 train_time:1044330ms step_avg:229.32ms step:4555/7050 train_time:1044567ms step_avg:229.32ms step:4556/7050 train_time:1044806ms step_avg:229.33ms step:4557/7050 
train_time:1045042ms step_avg:229.33ms step:4558/7050 train_time:1045281ms step_avg:229.33ms step:4559/7050 train_time:1045518ms step_avg:229.33ms step:4560/7050 train_time:1045754ms step_avg:229.33ms step:4561/7050 train_time:1045990ms step_avg:229.33ms step:4562/7050 train_time:1046228ms step_avg:229.34ms step:4563/7050 train_time:1046467ms step_avg:229.34ms step:4564/7050 train_time:1046704ms step_avg:229.34ms step:4565/7050 train_time:1046942ms step_avg:229.34ms step:4566/7050 train_time:1047178ms step_avg:229.34ms step:4567/7050 train_time:1047415ms step_avg:229.34ms step:4568/7050 train_time:1047654ms step_avg:229.35ms step:4569/7050 train_time:1047890ms step_avg:229.35ms step:4570/7050 train_time:1048128ms step_avg:229.35ms step:4571/7050 train_time:1048368ms step_avg:229.35ms step:4572/7050 train_time:1048607ms step_avg:229.35ms step:4573/7050 train_time:1048843ms step_avg:229.36ms step:4574/7050 train_time:1049081ms step_avg:229.36ms step:4575/7050 train_time:1049318ms step_avg:229.36ms step:4576/7050 train_time:1049555ms step_avg:229.36ms step:4577/7050 train_time:1049791ms step_avg:229.36ms step:4578/7050 train_time:1050029ms step_avg:229.36ms step:4579/7050 train_time:1050266ms step_avg:229.37ms step:4580/7050 train_time:1050503ms step_avg:229.37ms step:4581/7050 train_time:1050741ms step_avg:229.37ms step:4582/7050 train_time:1050976ms step_avg:229.37ms step:4583/7050 train_time:1051213ms step_avg:229.37ms step:4584/7050 train_time:1051450ms step_avg:229.37ms step:4585/7050 train_time:1051687ms step_avg:229.38ms step:4586/7050 train_time:1051922ms step_avg:229.38ms step:4587/7050 train_time:1052159ms step_avg:229.38ms step:4588/7050 train_time:1052395ms step_avg:229.38ms step:4589/7050 train_time:1052633ms step_avg:229.38ms step:4590/7050 train_time:1052871ms step_avg:229.38ms step:4591/7050 train_time:1053111ms step_avg:229.39ms step:4592/7050 train_time:1053349ms step_avg:229.39ms step:4593/7050 train_time:1053586ms step_avg:229.39ms step:4594/7050 
train_time:1053822ms step_avg:229.39ms step:4595/7050 train_time:1054058ms step_avg:229.39ms step:4596/7050 train_time:1054295ms step_avg:229.39ms step:4597/7050 train_time:1054535ms step_avg:229.40ms step:4598/7050 train_time:1054772ms step_avg:229.40ms step:4599/7050 train_time:1055011ms step_avg:229.40ms step:4600/7050 train_time:1055247ms step_avg:229.40ms step:4601/7050 train_time:1055483ms step_avg:229.40ms step:4602/7050 train_time:1055719ms step_avg:229.40ms step:4603/7050 train_time:1055956ms step_avg:229.41ms step:4604/7050 train_time:1056192ms step_avg:229.41ms step:4605/7050 train_time:1056432ms step_avg:229.41ms step:4606/7050 train_time:1056669ms step_avg:229.41ms step:4607/7050 train_time:1056905ms step_avg:229.41ms step:4608/7050 train_time:1057142ms step_avg:229.41ms step:4609/7050 train_time:1057377ms step_avg:229.42ms step:4610/7050 train_time:1057614ms step_avg:229.42ms step:4611/7050 train_time:1057851ms step_avg:229.42ms step:4612/7050 train_time:1058089ms step_avg:229.42ms step:4613/7050 train_time:1058327ms step_avg:229.42ms step:4614/7050 train_time:1058562ms step_avg:229.42ms step:4615/7050 train_time:1058799ms step_avg:229.43ms step:4616/7050 train_time:1059036ms step_avg:229.43ms step:4617/7050 train_time:1059273ms step_avg:229.43ms step:4618/7050 train_time:1059511ms step_avg:229.43ms step:4619/7050 train_time:1059747ms step_avg:229.43ms step:4620/7050 train_time:1059984ms step_avg:229.43ms step:4621/7050 train_time:1060221ms step_avg:229.44ms step:4622/7050 train_time:1060456ms step_avg:229.44ms step:4623/7050 train_time:1060692ms step_avg:229.44ms step:4624/7050 train_time:1060929ms step_avg:229.44ms step:4625/7050 train_time:1061168ms step_avg:229.44ms step:4625/7050 val_loss:3.0766 train_time:1061355ms step_avg:229.48ms step:4626/7050 train_time:1061406ms step_avg:229.44ms step:4627/7050 train_time:1061641ms step_avg:229.44ms step:4628/7050 train_time:1061883ms step_avg:229.45ms step:4629/7050 train_time:1062118ms step_avg:229.45ms 
step:4630/7050 train_time:1062354ms step_avg:229.45ms step:4631/7050 train_time:1062589ms step_avg:229.45ms step:4632/7050 train_time:1062828ms step_avg:229.45ms step:4633/7050 train_time:1063068ms step_avg:229.46ms step:4634/7050 train_time:1063304ms step_avg:229.46ms step:4635/7050 train_time:1063539ms step_avg:229.46ms step:4636/7050 train_time:1063778ms step_avg:229.46ms step:4637/7050 train_time:1064016ms step_avg:229.46ms step:4638/7050 train_time:1064252ms step_avg:229.46ms step:4639/7050 train_time:1064489ms step_avg:229.47ms step:4640/7050 train_time:1064725ms step_avg:229.47ms step:4641/7050 train_time:1064962ms step_avg:229.47ms step:4642/7050 train_time:1065198ms step_avg:229.47ms step:4643/7050 train_time:1065435ms step_avg:229.47ms step:4644/7050 train_time:1065674ms step_avg:229.47ms step:4645/7050 train_time:1065911ms step_avg:229.47ms step:4646/7050 train_time:1066149ms step_avg:229.48ms step:4647/7050 train_time:1066387ms step_avg:229.48ms step:4648/7050 train_time:1066626ms step_avg:229.48ms step:4649/7050 train_time:1066861ms step_avg:229.48ms step:4650/7050 train_time:1067098ms step_avg:229.48ms step:4651/7050 train_time:1067334ms step_avg:229.48ms step:4652/7050 train_time:1067572ms step_avg:229.49ms step:4653/7050 train_time:1067809ms step_avg:229.49ms step:4654/7050 train_time:1068046ms step_avg:229.49ms step:4655/7050 train_time:1068282ms step_avg:229.49ms step:4656/7050 train_time:1068518ms step_avg:229.49ms step:4657/7050 train_time:1068756ms step_avg:229.49ms step:4658/7050 train_time:1068993ms step_avg:229.50ms step:4659/7050 train_time:1069229ms step_avg:229.50ms step:4660/7050 train_time:1069465ms step_avg:229.50ms step:4661/7050 train_time:1069702ms step_avg:229.50ms step:4662/7050 train_time:1069939ms step_avg:229.50ms step:4663/7050 train_time:1070178ms step_avg:229.50ms step:4664/7050 train_time:1070417ms step_avg:229.51ms step:4665/7050 train_time:1070654ms step_avg:229.51ms step:4666/7050 train_time:1070892ms step_avg:229.51ms 
step:4667/7050 train_time:1071127ms step_avg:229.51ms step:4668/7050 train_time:1071364ms step_avg:229.51ms step:4669/7050 train_time:1071601ms step_avg:229.51ms step:4670/7050 train_time:1071839ms step_avg:229.52ms step:4671/7050 train_time:1072077ms step_avg:229.52ms step:4672/7050 train_time:1072315ms step_avg:229.52ms step:4673/7050 train_time:1072552ms step_avg:229.52ms step:4674/7050 train_time:1072789ms step_avg:229.52ms step:4675/7050 train_time:1073027ms step_avg:229.52ms step:4676/7050 train_time:1073261ms step_avg:229.53ms step:4677/7050 train_time:1073498ms step_avg:229.53ms step:4678/7050 train_time:1073735ms step_avg:229.53ms step:4679/7050 train_time:1073974ms step_avg:229.53ms step:4680/7050 train_time:1074212ms step_avg:229.53ms step:4681/7050 train_time:1074447ms step_avg:229.53ms step:4682/7050 train_time:1074684ms step_avg:229.54ms step:4683/7050 train_time:1074921ms step_avg:229.54ms step:4684/7050 train_time:1075159ms step_avg:229.54ms step:4685/7050 train_time:1075399ms step_avg:229.54ms step:4686/7050 train_time:1075635ms step_avg:229.54ms step:4687/7050 train_time:1075871ms step_avg:229.54ms step:4688/7050 train_time:1076108ms step_avg:229.55ms step:4689/7050 train_time:1076345ms step_avg:229.55ms step:4690/7050 train_time:1076583ms step_avg:229.55ms step:4691/7050 train_time:1076818ms step_avg:229.55ms step:4692/7050 train_time:1077056ms step_avg:229.55ms step:4693/7050 train_time:1077296ms step_avg:229.55ms step:4694/7050 train_time:1077532ms step_avg:229.56ms step:4695/7050 train_time:1077772ms step_avg:229.56ms step:4696/7050 train_time:1078008ms step_avg:229.56ms step:4697/7050 train_time:1078244ms step_avg:229.56ms step:4698/7050 train_time:1078482ms step_avg:229.56ms step:4699/7050 train_time:1078720ms step_avg:229.56ms step:4700/7050 train_time:1078959ms step_avg:229.57ms step:4701/7050 train_time:1079194ms step_avg:229.57ms step:4702/7050 train_time:1079432ms step_avg:229.57ms step:4703/7050 train_time:1079669ms step_avg:229.57ms 
step:4704/7050 train_time:1079910ms step_avg:229.57ms step:4705/7050 train_time:1080148ms step_avg:229.57ms step:4706/7050 train_time:1080389ms step_avg:229.58ms step:4707/7050 train_time:1080631ms step_avg:229.58ms step:4708/7050 train_time:1080870ms step_avg:229.58ms step:4709/7050 train_time:1081109ms step_avg:229.58ms step:4710/7050 train_time:1081350ms step_avg:229.59ms step:4711/7050 train_time:1081590ms step_avg:229.59ms step:4712/7050 train_time:1081831ms step_avg:229.59ms step:4713/7050 train_time:1082070ms step_avg:229.59ms step:4714/7050 train_time:1082313ms step_avg:229.60ms step:4715/7050 train_time:1082552ms step_avg:229.60ms step:4716/7050 train_time:1082792ms step_avg:229.60ms step:4717/7050 train_time:1083031ms step_avg:229.60ms step:4718/7050 train_time:1083274ms step_avg:229.60ms step:4719/7050 train_time:1083516ms step_avg:229.61ms step:4720/7050 train_time:1083754ms step_avg:229.61ms step:4721/7050 train_time:1083994ms step_avg:229.61ms step:4722/7050 train_time:1084234ms step_avg:229.61ms step:4723/7050 train_time:1084477ms step_avg:229.62ms step:4724/7050 train_time:1084715ms step_avg:229.62ms step:4725/7050 train_time:1084956ms step_avg:229.62ms step:4726/7050 train_time:1085198ms step_avg:229.62ms step:4727/7050 train_time:1085438ms step_avg:229.63ms step:4728/7050 train_time:1085677ms step_avg:229.63ms step:4729/7050 train_time:1085916ms step_avg:229.63ms step:4730/7050 train_time:1086155ms step_avg:229.63ms step:4731/7050 train_time:1086396ms step_avg:229.63ms step:4732/7050 train_time:1086635ms step_avg:229.64ms step:4733/7050 train_time:1086875ms step_avg:229.64ms step:4734/7050 train_time:1087115ms step_avg:229.64ms step:4735/7050 train_time:1087355ms step_avg:229.64ms step:4736/7050 train_time:1087595ms step_avg:229.64ms step:4737/7050 train_time:1087834ms step_avg:229.65ms step:4738/7050 train_time:1088078ms step_avg:229.65ms step:4739/7050 train_time:1088320ms step_avg:229.65ms step:4740/7050 train_time:1088558ms step_avg:229.65ms 
step:4741/7050 train_time:1088799ms step_avg:229.66ms step:4742/7050 train_time:1089040ms step_avg:229.66ms step:4743/7050 train_time:1089280ms step_avg:229.66ms step:4744/7050 train_time:1089522ms step_avg:229.66ms step:4745/7050 train_time:1089760ms step_avg:229.66ms step:4746/7050 train_time:1090000ms step_avg:229.67ms step:4747/7050 train_time:1090244ms step_avg:229.67ms step:4748/7050 train_time:1090485ms step_avg:229.67ms step:4749/7050 train_time:1090725ms step_avg:229.67ms step:4750/7050 train_time:1090965ms step_avg:229.68ms step:4750/7050 val_loss:3.0649 train_time:1091155ms step_avg:229.72ms step:4751/7050 train_time:1091267ms step_avg:229.69ms step:4752/7050 train_time:1091503ms step_avg:229.69ms step:4753/7050 train_time:1091741ms step_avg:229.70ms step:4754/7050 train_time:1091978ms step_avg:229.70ms step:4755/7050 train_time:1092221ms step_avg:229.70ms step:4756/7050 train_time:1092463ms step_avg:229.70ms step:4757/7050 train_time:1092700ms step_avg:229.70ms step:4758/7050 train_time:1092939ms step_avg:229.71ms step:4759/7050 train_time:1093181ms step_avg:229.71ms step:4760/7050 train_time:1093420ms step_avg:229.71ms step:4761/7050 train_time:1093658ms step_avg:229.71ms step:4762/7050 train_time:1093896ms step_avg:229.71ms step:4763/7050 train_time:1094138ms step_avg:229.72ms step:4764/7050 train_time:1094378ms step_avg:229.72ms step:4765/7050 train_time:1094617ms step_avg:229.72ms step:4766/7050 train_time:1094857ms step_avg:229.72ms step:4767/7050 train_time:1095097ms step_avg:229.72ms step:4768/7050 train_time:1095338ms step_avg:229.73ms step:4769/7050 train_time:1095577ms step_avg:229.73ms step:4770/7050 train_time:1095816ms step_avg:229.73ms step:4771/7050 train_time:1096056ms step_avg:229.73ms step:4772/7050 train_time:1096294ms step_avg:229.73ms step:4773/7050 train_time:1096533ms step_avg:229.74ms step:4774/7050 train_time:1096773ms step_avg:229.74ms step:4775/7050 train_time:1097014ms step_avg:229.74ms step:4776/7050 train_time:1097254ms 
step_avg:229.74ms step:4777/7050 train_time:1097493ms step_avg:229.75ms step:4778/7050 train_time:1097732ms step_avg:229.75ms step:4779/7050 train_time:1097972ms step_avg:229.75ms step:4780/7050 train_time:1098212ms step_avg:229.75ms step:4781/7050 train_time:1098452ms step_avg:229.75ms step:4782/7050 train_time:1098695ms step_avg:229.76ms step:4783/7050 train_time:1098936ms step_avg:229.76ms step:4784/7050 train_time:1099174ms step_avg:229.76ms step:4785/7050 train_time:1099414ms step_avg:229.76ms step:4786/7050 train_time:1099655ms step_avg:229.76ms step:4787/7050 train_time:1099893ms step_avg:229.77ms step:4788/7050 train_time:1100135ms step_avg:229.77ms step:4789/7050 train_time:1100375ms step_avg:229.77ms step:4790/7050 train_time:1100617ms step_avg:229.77ms step:4791/7050 train_time:1100861ms step_avg:229.78ms step:4792/7050 train_time:1101099ms step_avg:229.78ms step:4793/7050 train_time:1101338ms step_avg:229.78ms step:4794/7050 train_time:1101577ms step_avg:229.78ms step:4795/7050 train_time:1101816ms step_avg:229.78ms step:4796/7050 train_time:1102056ms step_avg:229.79ms step:4797/7050 train_time:1102297ms step_avg:229.79ms step:4798/7050 train_time:1102535ms step_avg:229.79ms step:4799/7050 train_time:1102774ms step_avg:229.79ms step:4800/7050 train_time:1103014ms step_avg:229.79ms step:4801/7050 train_time:1103255ms step_avg:229.80ms step:4802/7050 train_time:1103494ms step_avg:229.80ms step:4803/7050 train_time:1103734ms step_avg:229.80ms step:4804/7050 train_time:1103974ms step_avg:229.80ms step:4805/7050 train_time:1104218ms step_avg:229.81ms step:4806/7050 train_time:1104458ms step_avg:229.81ms step:4807/7050 train_time:1104698ms step_avg:229.81ms step:4808/7050 train_time:1104937ms step_avg:229.81ms step:4809/7050 train_time:1105178ms step_avg:229.81ms step:4810/7050 train_time:1105420ms step_avg:229.82ms step:4811/7050 train_time:1105659ms step_avg:229.82ms step:4812/7050 train_time:1105898ms step_avg:229.82ms step:4813/7050 train_time:1106139ms 
step_avg:229.82ms step:4814/7050 train_time:1106380ms step_avg:229.83ms step:4815/7050 train_time:1106621ms step_avg:229.83ms step:4816/7050 train_time:1106861ms step_avg:229.83ms step:4817/7050 train_time:1107100ms step_avg:229.83ms step:4818/7050 train_time:1107341ms step_avg:229.83ms step:4819/7050 train_time:1107580ms step_avg:229.84ms step:4820/7050 train_time:1107820ms step_avg:229.84ms step:4821/7050 train_time:1108061ms step_avg:229.84ms step:4822/7050 train_time:1108303ms step_avg:229.84ms step:4823/7050 train_time:1108543ms step_avg:229.85ms step:4824/7050 train_time:1108781ms step_avg:229.85ms step:4825/7050 train_time:1109022ms step_avg:229.85ms step:4826/7050 train_time:1109264ms step_avg:229.85ms step:4827/7050 train_time:1109503ms step_avg:229.85ms step:4828/7050 train_time:1109742ms step_avg:229.86ms step:4829/7050 train_time:1109982ms step_avg:229.86ms step:4830/7050 train_time:1110222ms step_avg:229.86ms step:4831/7050 train_time:1110463ms step_avg:229.86ms step:4832/7050 train_time:1110704ms step_avg:229.86ms step:4833/7050 train_time:1110942ms step_avg:229.87ms step:4834/7050 train_time:1111180ms step_avg:229.87ms step:4835/7050 train_time:1111419ms step_avg:229.87ms step:4836/7050 train_time:1111661ms step_avg:229.87ms step:4837/7050 train_time:1111900ms step_avg:229.87ms step:4838/7050 train_time:1112141ms step_avg:229.88ms step:4839/7050 train_time:1112380ms step_avg:229.88ms step:4840/7050 train_time:1112622ms step_avg:229.88ms step:4841/7050 train_time:1112863ms step_avg:229.88ms step:4842/7050 train_time:1113100ms step_avg:229.88ms step:4843/7050 train_time:1113341ms step_avg:229.89ms step:4844/7050 train_time:1113581ms step_avg:229.89ms step:4845/7050 train_time:1113821ms step_avg:229.89ms step:4846/7050 train_time:1114062ms step_avg:229.89ms step:4847/7050 train_time:1114302ms step_avg:229.90ms step:4848/7050 train_time:1114544ms step_avg:229.90ms step:4849/7050 train_time:1114783ms step_avg:229.90ms step:4850/7050 train_time:1115022ms 
step_avg:229.90ms step:4851/7050 train_time:1115262ms step_avg:229.90ms step:4852/7050 train_time:1115502ms step_avg:229.91ms step:4853/7050 train_time:1115745ms step_avg:229.91ms step:4854/7050 train_time:1115985ms step_avg:229.91ms step:4855/7050 train_time:1116224ms step_avg:229.91ms step:4856/7050 train_time:1116462ms step_avg:229.91ms step:4857/7050 train_time:1116702ms step_avg:229.92ms step:4858/7050 train_time:1116941ms step_avg:229.92ms step:4859/7050 train_time:1117181ms step_avg:229.92ms step:4860/7050 train_time:1117423ms step_avg:229.92ms step:4861/7050 train_time:1117663ms step_avg:229.92ms step:4862/7050 train_time:1117900ms step_avg:229.93ms step:4863/7050 train_time:1118140ms step_avg:229.93ms step:4864/7050 train_time:1118380ms step_avg:229.93ms step:4865/7050 train_time:1118619ms step_avg:229.93ms step:4866/7050 train_time:1118858ms step_avg:229.93ms step:4867/7050 train_time:1119097ms step_avg:229.94ms step:4868/7050 train_time:1119336ms step_avg:229.94ms step:4869/7050 train_time:1119575ms step_avg:229.94ms step:4870/7050 train_time:1119816ms step_avg:229.94ms step:4871/7050 train_time:1120056ms step_avg:229.94ms step:4872/7050 train_time:1120295ms step_avg:229.95ms step:4873/7050 train_time:1120536ms step_avg:229.95ms step:4874/7050 train_time:1120776ms step_avg:229.95ms step:4875/7050 train_time:1121015ms step_avg:229.95ms step:4875/7050 val_loss:3.0553 train_time:1121204ms step_avg:229.99ms step:4876/7050 train_time:1121257ms step_avg:229.95ms step:4877/7050 train_time:1121496ms step_avg:229.96ms step:4878/7050 train_time:1121741ms step_avg:229.96ms step:4879/7050 train_time:1121979ms step_avg:229.96ms step:4880/7050 train_time:1122216ms step_avg:229.96ms step:4881/7050 train_time:1122453ms step_avg:229.96ms step:4882/7050 train_time:1122694ms step_avg:229.97ms step:4883/7050 train_time:1122935ms step_avg:229.97ms step:4884/7050 train_time:1123174ms step_avg:229.97ms step:4885/7050 train_time:1123413ms step_avg:229.97ms step:4886/7050 
train_time:1123653ms step_avg:229.97ms step:4887/7050 train_time:1123892ms step_avg:229.98ms step:4888/7050 train_time:1124130ms step_avg:229.98ms step:4889/7050 train_time:1124369ms step_avg:229.98ms step:4890/7050 train_time:1124610ms step_avg:229.98ms step:4891/7050 train_time:1124849ms step_avg:229.98ms step:4892/7050 train_time:1125088ms step_avg:229.99ms step:4893/7050 train_time:1125327ms step_avg:229.99ms step:4894/7050 train_time:1125568ms step_avg:229.99ms step:4895/7050 train_time:1125808ms step_avg:229.99ms step:4896/7050 train_time:1126048ms step_avg:229.99ms step:4897/7050 train_time:1126288ms step_avg:230.00ms step:4898/7050 train_time:1126529ms step_avg:230.00ms step:4899/7050 train_time:1126771ms step_avg:230.00ms step:4900/7050 train_time:1127013ms step_avg:230.00ms step:4901/7050 train_time:1127254ms step_avg:230.00ms step:4902/7050 train_time:1127493ms step_avg:230.01ms step:4903/7050 train_time:1127732ms step_avg:230.01ms step:4904/7050 train_time:1127972ms step_avg:230.01ms step:4905/7050 train_time:1128212ms step_avg:230.01ms step:4906/7050 train_time:1128453ms step_avg:230.01ms step:4907/7050 train_time:1128694ms step_avg:230.02ms step:4908/7050 train_time:1128932ms step_avg:230.02ms step:4909/7050 train_time:1129169ms step_avg:230.02ms step:4910/7050 train_time:1129409ms step_avg:230.02ms step:4911/7050 train_time:1129649ms step_avg:230.02ms step:4912/7050 train_time:1129889ms step_avg:230.03ms step:4913/7050 train_time:1130129ms step_avg:230.03ms step:4914/7050 train_time:1130370ms step_avg:230.03ms step:4915/7050 train_time:1130609ms step_avg:230.03ms step:4916/7050 train_time:1130849ms step_avg:230.03ms step:4917/7050 train_time:1131090ms step_avg:230.04ms step:4918/7050 train_time:1131329ms step_avg:230.04ms step:4919/7050 train_time:1131570ms step_avg:230.04ms step:4920/7050 train_time:1131810ms step_avg:230.04ms step:4921/7050 train_time:1132048ms step_avg:230.04ms step:4922/7050 train_time:1132287ms step_avg:230.05ms step:4923/7050 
train_time:1132527ms step_avg:230.05ms step:4924/7050 train_time:1132766ms step_avg:230.05ms step:4925/7050 train_time:1133005ms step_avg:230.05ms step:4926/7050 train_time:1133245ms step_avg:230.05ms step:4927/7050 train_time:1133484ms step_avg:230.06ms step:4928/7050 train_time:1133725ms step_avg:230.06ms step:4929/7050 train_time:1133965ms step_avg:230.06ms step:4930/7050 train_time:1134204ms step_avg:230.06ms step:4931/7050 train_time:1134444ms step_avg:230.06ms step:4932/7050 train_time:1134682ms step_avg:230.07ms step:4933/7050 train_time:1134925ms step_avg:230.07ms step:4934/7050 train_time:1135168ms step_avg:230.07ms step:4935/7050 train_time:1135407ms step_avg:230.07ms step:4936/7050 train_time:1135646ms step_avg:230.07ms step:4937/7050 train_time:1135888ms step_avg:230.08ms step:4938/7050 train_time:1136127ms step_avg:230.08ms step:4939/7050 train_time:1136368ms step_avg:230.08ms step:4940/7050 train_time:1136608ms step_avg:230.08ms step:4941/7050 train_time:1136847ms step_avg:230.08ms step:4942/7050 train_time:1137086ms step_avg:230.09ms step:4943/7050 train_time:1137325ms step_avg:230.09ms step:4944/7050 train_time:1137565ms step_avg:230.09ms step:4945/7050 train_time:1137807ms step_avg:230.09ms step:4946/7050 train_time:1138047ms step_avg:230.09ms step:4947/7050 train_time:1138287ms step_avg:230.10ms step:4948/7050 train_time:1138526ms step_avg:230.10ms step:4949/7050 train_time:1138764ms step_avg:230.10ms step:4950/7050 train_time:1139004ms step_avg:230.10ms step:4951/7050 train_time:1139242ms step_avg:230.10ms step:4952/7050 train_time:1139480ms step_avg:230.10ms step:4953/7050 train_time:1139720ms step_avg:230.11ms step:4954/7050 train_time:1139960ms step_avg:230.11ms step:4955/7050 train_time:1140203ms step_avg:230.11ms step:4956/7050 train_time:1140442ms step_avg:230.11ms step:4957/7050 train_time:1140683ms step_avg:230.12ms step:4958/7050 train_time:1140922ms step_avg:230.12ms step:4959/7050 train_time:1141162ms step_avg:230.12ms step:4960/7050 
train_time:1141400ms step_avg:230.12ms step:4961/7050 train_time:1141640ms step_avg:230.12ms step:4962/7050 train_time:1141879ms step_avg:230.12ms step:4963/7050 train_time:1142118ms step_avg:230.13ms step:4964/7050 train_time:1142358ms step_avg:230.13ms step:4965/7050 train_time:1142597ms step_avg:230.13ms step:4966/7050 train_time:1142839ms step_avg:230.13ms step:4967/7050 train_time:1143082ms step_avg:230.14ms step:4968/7050 train_time:1143322ms step_avg:230.14ms step:4969/7050 train_time:1143562ms step_avg:230.14ms step:4970/7050 train_time:1143802ms step_avg:230.14ms step:4971/7050 train_time:1144043ms step_avg:230.14ms step:4972/7050 train_time:1144283ms step_avg:230.15ms step:4973/7050 train_time:1144528ms step_avg:230.15ms step:4974/7050 train_time:1144769ms step_avg:230.15ms step:4975/7050 train_time:1145008ms step_avg:230.15ms step:4976/7050 train_time:1145247ms step_avg:230.15ms step:4977/7050 train_time:1145488ms step_avg:230.16ms step:4978/7050 train_time:1145732ms step_avg:230.16ms step:4979/7050 train_time:1145974ms step_avg:230.16ms step:4980/7050 train_time:1146214ms step_avg:230.16ms step:4981/7050 train_time:1146456ms step_avg:230.17ms step:4982/7050 train_time:1146696ms step_avg:230.17ms step:4983/7050 train_time:1146935ms step_avg:230.17ms step:4984/7050 train_time:1147173ms step_avg:230.17ms step:4985/7050 train_time:1147414ms step_avg:230.17ms step:4986/7050 train_time:1147653ms step_avg:230.18ms step:4987/7050 train_time:1147893ms step_avg:230.18ms step:4988/7050 train_time:1148131ms step_avg:230.18ms step:4989/7050 train_time:1148373ms step_avg:230.18ms step:4990/7050 train_time:1148610ms step_avg:230.18ms step:4991/7050 train_time:1148850ms step_avg:230.18ms step:4992/7050 train_time:1149091ms step_avg:230.19ms step:4993/7050 train_time:1149330ms step_avg:230.19ms step:4994/7050 train_time:1149571ms step_avg:230.19ms step:4995/7050 train_time:1149811ms step_avg:230.19ms step:4996/7050 train_time:1150051ms step_avg:230.19ms step:4997/7050 
train_time:1150288ms step_avg:230.20ms step:4998/7050 train_time:1150528ms step_avg:230.20ms step:4999/7050 train_time:1150770ms step_avg:230.20ms step:5000/7050 train_time:1151009ms step_avg:230.20ms step:5000/7050 val_loss:3.0465 train_time:1151201ms step_avg:230.24ms step:5001/7050 train_time:1151256ms step_avg:230.21ms step:5002/7050 train_time:1151490ms step_avg:230.21ms step:5003/7050 train_time:1151737ms step_avg:230.21ms step:5004/7050 train_time:1151975ms step_avg:230.21ms step:5005/7050 train_time:1152214ms step_avg:230.21ms step:5006/7050 train_time:1152455ms step_avg:230.21ms step:5007/7050 train_time:1152697ms step_avg:230.22ms step:5008/7050 train_time:1152936ms step_avg:230.22ms step:5009/7050 train_time:1153175ms step_avg:230.22ms step:5010/7050 train_time:1153414ms step_avg:230.22ms step:5011/7050 train_time:1153655ms step_avg:230.22ms step:5012/7050 train_time:1153892ms step_avg:230.23ms step:5013/7050 train_time:1154133ms step_avg:230.23ms step:5014/7050 train_time:1154373ms step_avg:230.23ms step:5015/7050 train_time:1154613ms step_avg:230.23ms step:5016/7050 train_time:1154855ms step_avg:230.23ms step:5017/7050 train_time:1155094ms step_avg:230.24ms step:5018/7050 train_time:1155335ms step_avg:230.24ms step:5019/7050 train_time:1155575ms step_avg:230.24ms step:5020/7050 train_time:1155814ms step_avg:230.24ms step:5021/7050 train_time:1156055ms step_avg:230.24ms step:5022/7050 train_time:1156296ms step_avg:230.25ms step:5023/7050 train_time:1156537ms step_avg:230.25ms step:5024/7050 train_time:1156777ms step_avg:230.25ms step:5025/7050 train_time:1157018ms step_avg:230.25ms step:5026/7050 train_time:1157260ms step_avg:230.25ms step:5027/7050 train_time:1157498ms step_avg:230.26ms step:5028/7050 train_time:1157738ms step_avg:230.26ms step:5029/7050 train_time:1157979ms step_avg:230.26ms step:5030/7050 train_time:1158220ms step_avg:230.26ms step:5031/7050 train_time:1158459ms step_avg:230.26ms step:5032/7050 train_time:1158697ms step_avg:230.27ms 
step:5033/7050 train_time:1158936ms step_avg:230.27ms step:5034/7050 train_time:1159177ms step_avg:230.27ms step:5035/7050 train_time:1159417ms step_avg:230.27ms step:5036/7050 train_time:1159658ms step_avg:230.27ms step:5037/7050 train_time:1159899ms step_avg:230.28ms step:5038/7050 train_time:1160137ms step_avg:230.28ms step:5039/7050 train_time:1160378ms step_avg:230.28ms step:5040/7050 train_time:1160620ms step_avg:230.28ms step:5041/7050 train_time:1160860ms step_avg:230.28ms step:5042/7050 train_time:1161097ms step_avg:230.29ms step:5043/7050 train_time:1161337ms step_avg:230.29ms step:5044/7050 train_time:1161577ms step_avg:230.29ms step:5045/7050 train_time:1161817ms step_avg:230.29ms step:5046/7050 train_time:1162057ms step_avg:230.29ms step:5047/7050 train_time:1162298ms step_avg:230.29ms step:5048/7050 train_time:1162537ms step_avg:230.30ms step:5049/7050 train_time:1162777ms step_avg:230.30ms step:5050/7050 train_time:1163015ms step_avg:230.30ms step:5051/7050 train_time:1163256ms step_avg:230.30ms step:5052/7050 train_time:1163495ms step_avg:230.30ms step:5053/7050 train_time:1163736ms step_avg:230.31ms step:5054/7050 train_time:1163976ms step_avg:230.31ms step:5055/7050 train_time:1164218ms step_avg:230.31ms step:5056/7050 train_time:1164456ms step_avg:230.31ms step:5057/7050 train_time:1164696ms step_avg:230.31ms step:5058/7050 train_time:1164937ms step_avg:230.32ms step:5059/7050 train_time:1165176ms step_avg:230.32ms step:5060/7050 train_time:1165416ms step_avg:230.32ms step:5061/7050 train_time:1165656ms step_avg:230.32ms step:5062/7050 train_time:1165897ms step_avg:230.32ms step:5063/7050 train_time:1166137ms step_avg:230.33ms step:5064/7050 train_time:1166378ms step_avg:230.33ms step:5065/7050 train_time:1166618ms step_avg:230.33ms step:5066/7050 train_time:1166858ms step_avg:230.33ms step:5067/7050 train_time:1167097ms step_avg:230.33ms step:5068/7050 train_time:1167335ms step_avg:230.33ms step:5069/7050 train_time:1167575ms step_avg:230.34ms 
step:5070/7050 train_time:1167816ms step_avg:230.34ms step:5071/7050 train_time:1168058ms step_avg:230.34ms step:5072/7050 train_time:1168296ms step_avg:230.34ms step:5073/7050 train_time:1168535ms step_avg:230.34ms step:5074/7050 train_time:1168775ms step_avg:230.35ms step:5075/7050 train_time:1169016ms step_avg:230.35ms step:5076/7050 train_time:1169255ms step_avg:230.35ms step:5077/7050 train_time:1169495ms step_avg:230.35ms step:5078/7050 train_time:1169735ms step_avg:230.35ms step:5079/7050 train_time:1169978ms step_avg:230.36ms step:5080/7050 train_time:1170217ms step_avg:230.36ms step:5081/7050 train_time:1170456ms step_avg:230.36ms step:5082/7050 train_time:1170695ms step_avg:230.36ms step:5083/7050 train_time:1170936ms step_avg:230.36ms step:5084/7050 train_time:1171176ms step_avg:230.37ms step:5085/7050 train_time:1171417ms step_avg:230.37ms step:5086/7050 train_time:1171659ms step_avg:230.37ms step:5087/7050 train_time:1171898ms step_avg:230.37ms step:5088/7050 train_time:1172142ms step_avg:230.37ms step:5089/7050 train_time:1172381ms step_avg:230.38ms step:5090/7050 train_time:1172620ms step_avg:230.38ms step:5091/7050 train_time:1172861ms step_avg:230.38ms step:5092/7050 train_time:1173100ms step_avg:230.38ms step:5093/7050 train_time:1173339ms step_avg:230.38ms step:5094/7050 train_time:1173581ms step_avg:230.38ms step:5095/7050 train_time:1173821ms step_avg:230.39ms step:5096/7050 train_time:1174061ms step_avg:230.39ms step:5097/7050 train_time:1174300ms step_avg:230.39ms step:5098/7050 train_time:1174539ms step_avg:230.39ms step:5099/7050 train_time:1174781ms step_avg:230.39ms step:5100/7050 train_time:1175023ms step_avg:230.40ms step:5101/7050 train_time:1175264ms step_avg:230.40ms step:5102/7050 train_time:1175505ms step_avg:230.40ms step:5103/7050 train_time:1175745ms step_avg:230.40ms step:5104/7050 train_time:1175985ms step_avg:230.40ms step:5105/7050 train_time:1176223ms step_avg:230.41ms step:5106/7050 train_time:1176464ms step_avg:230.41ms 
step:5107/7050 train_time:1176704ms step_avg:230.41ms step:5108/7050 train_time:1176945ms step_avg:230.41ms step:5109/7050 train_time:1177184ms step_avg:230.41ms step:5110/7050 train_time:1177421ms step_avg:230.42ms step:5111/7050 train_time:1177662ms step_avg:230.42ms step:5112/7050 train_time:1177903ms step_avg:230.42ms step:5113/7050 train_time:1178144ms step_avg:230.42ms step:5114/7050 train_time:1178382ms step_avg:230.42ms step:5115/7050 train_time:1178621ms step_avg:230.42ms step:5116/7050 train_time:1178863ms step_avg:230.43ms step:5117/7050 train_time:1179101ms step_avg:230.43ms step:5118/7050 train_time:1179341ms step_avg:230.43ms step:5119/7050 train_time:1179580ms step_avg:230.43ms step:5120/7050 train_time:1179823ms step_avg:230.43ms step:5121/7050 train_time:1180066ms step_avg:230.44ms step:5122/7050 train_time:1180303ms step_avg:230.44ms step:5123/7050 train_time:1180543ms step_avg:230.44ms step:5124/7050 train_time:1180787ms step_avg:230.44ms step:5125/7050 train_time:1181026ms step_avg:230.44ms step:5125/7050 val_loss:3.0371 train_time:1181217ms step_avg:230.48ms step:5126/7050 train_time:1181268ms step_avg:230.45ms step:5127/7050 train_time:1181508ms step_avg:230.45ms step:5128/7050 train_time:1181753ms step_avg:230.45ms step:5129/7050 train_time:1181991ms step_avg:230.45ms step:5130/7050 train_time:1182229ms step_avg:230.45ms step:5131/7050 train_time:1182469ms step_avg:230.46ms step:5132/7050 train_time:1182713ms step_avg:230.46ms step:5133/7050 train_time:1182952ms step_avg:230.46ms step:5134/7050 train_time:1183193ms step_avg:230.46ms step:5135/7050 train_time:1183431ms step_avg:230.46ms step:5136/7050 train_time:1183672ms step_avg:230.47ms step:5137/7050 train_time:1183914ms step_avg:230.47ms step:5138/7050 train_time:1184156ms step_avg:230.47ms step:5139/7050 train_time:1184396ms step_avg:230.47ms step:5140/7050 train_time:1184635ms step_avg:230.47ms step:5141/7050 train_time:1184875ms step_avg:230.48ms step:5142/7050 train_time:1185114ms 
step_avg:230.48ms step:5143/7050 train_time:1185353ms step_avg:230.48ms step:5144/7050 train_time:1185594ms step_avg:230.48ms step:5145/7050 train_time:1185835ms step_avg:230.48ms step:5146/7050 train_time:1186074ms step_avg:230.48ms step:5147/7050 train_time:1186314ms step_avg:230.49ms step:5148/7050 train_time:1186554ms step_avg:230.49ms step:5149/7050 train_time:1186796ms step_avg:230.49ms step:5150/7050 train_time:1187034ms step_avg:230.49ms step:5151/7050 train_time:1187274ms step_avg:230.49ms step:5152/7050 train_time:1187513ms step_avg:230.50ms step:5153/7050 train_time:1187754ms step_avg:230.50ms step:5154/7050 train_time:1187993ms step_avg:230.50ms step:5155/7050 train_time:1188234ms step_avg:230.50ms step:5156/7050 train_time:1188473ms step_avg:230.50ms step:5157/7050 train_time:1188712ms step_avg:230.50ms step:5158/7050 train_time:1188954ms step_avg:230.51ms step:5159/7050 train_time:1189194ms step_avg:230.51ms step:5160/7050 train_time:1189434ms step_avg:230.51ms step:5161/7050 train_time:1189674ms step_avg:230.51ms step:5162/7050 train_time:1189916ms step_avg:230.51ms step:5163/7050 train_time:1190153ms step_avg:230.52ms step:5164/7050 train_time:1190394ms step_avg:230.52ms step:5165/7050 train_time:1190634ms step_avg:230.52ms step:5166/7050 train_time:1190874ms step_avg:230.52ms step:5167/7050 train_time:1191115ms step_avg:230.52ms step:5168/7050 train_time:1191356ms step_avg:230.53ms step:5169/7050 train_time:1191595ms step_avg:230.53ms step:5170/7050 train_time:1191835ms step_avg:230.53ms step:5171/7050 train_time:1192075ms step_avg:230.53ms step:5172/7050 train_time:1192316ms step_avg:230.53ms step:5173/7050 train_time:1192555ms step_avg:230.53ms step:5174/7050 train_time:1192795ms step_avg:230.54ms step:5175/7050 train_time:1193036ms step_avg:230.54ms step:5176/7050 train_time:1193275ms step_avg:230.54ms step:5177/7050 train_time:1193515ms step_avg:230.54ms step:5178/7050 train_time:1193754ms step_avg:230.54ms step:5179/7050 train_time:1193995ms 
step_avg:230.55ms step:5180/7050 train_time:1194239ms step_avg:230.55ms step:5181/7050 train_time:1194479ms step_avg:230.55ms step:5182/7050 train_time:1194719ms step_avg:230.55ms step:5183/7050 train_time:1194960ms step_avg:230.55ms step:5184/7050 train_time:1195199ms step_avg:230.56ms step:5185/7050 train_time:1195440ms step_avg:230.56ms step:5186/7050 train_time:1195678ms step_avg:230.56ms step:5187/7050 train_time:1195916ms step_avg:230.56ms step:5188/7050 train_time:1196158ms step_avg:230.56ms step:5189/7050 train_time:1196397ms step_avg:230.56ms step:5190/7050 train_time:1196635ms step_avg:230.57ms step:5191/7050 train_time:1196876ms step_avg:230.57ms step:5192/7050 train_time:1197119ms step_avg:230.57ms step:5193/7050 train_time:1197361ms step_avg:230.57ms step:5194/7050 train_time:1197600ms step_avg:230.57ms step:5195/7050 train_time:1197841ms step_avg:230.58ms step:5196/7050 train_time:1198080ms step_avg:230.58ms step:5197/7050 train_time:1198320ms step_avg:230.58ms step:5198/7050 train_time:1198559ms step_avg:230.58ms step:5199/7050 train_time:1198800ms step_avg:230.58ms step:5200/7050 train_time:1199040ms step_avg:230.58ms step:5201/7050 train_time:1199279ms step_avg:230.59ms step:5202/7050 train_time:1199519ms step_avg:230.59ms step:5203/7050 train_time:1199759ms step_avg:230.59ms step:5204/7050 train_time:1199999ms step_avg:230.59ms step:5205/7050 train_time:1200240ms step_avg:230.59ms step:5206/7050 train_time:1200479ms step_avg:230.60ms step:5207/7050 train_time:1200719ms step_avg:230.60ms step:5208/7050 train_time:1200960ms step_avg:230.60ms step:5209/7050 train_time:1201199ms step_avg:230.60ms step:5210/7050 train_time:1201441ms step_avg:230.60ms step:5211/7050 train_time:1201680ms step_avg:230.60ms step:5212/7050 train_time:1201921ms step_avg:230.61ms step:5213/7050 train_time:1202161ms step_avg:230.61ms step:5214/7050 train_time:1202402ms step_avg:230.61ms step:5215/7050 train_time:1202644ms step_avg:230.61ms step:5216/7050 train_time:1202882ms 
step_avg:230.61ms step:5217/7050 train_time:1203120ms step_avg:230.62ms step:5218/7050 train_time:1203361ms step_avg:230.62ms step:5219/7050 train_time:1203600ms step_avg:230.62ms step:5220/7050 train_time:1203841ms step_avg:230.62ms step:5221/7050 train_time:1204083ms step_avg:230.62ms step:5222/7050 train_time:1204322ms step_avg:230.62ms step:5223/7050 train_time:1204560ms step_avg:230.63ms step:5224/7050 train_time:1204801ms step_avg:230.63ms step:5225/7050 train_time:1205042ms step_avg:230.63ms step:5226/7050 train_time:1205282ms step_avg:230.63ms step:5227/7050 train_time:1205520ms step_avg:230.63ms step:5228/7050 train_time:1205761ms step_avg:230.64ms step:5229/7050 train_time:1206001ms step_avg:230.64ms step:5230/7050 train_time:1206241ms step_avg:230.64ms step:5231/7050 train_time:1206481ms step_avg:230.64ms step:5232/7050 train_time:1206721ms step_avg:230.64ms step:5233/7050 train_time:1206961ms step_avg:230.64ms step:5234/7050 train_time:1207205ms step_avg:230.65ms step:5235/7050 train_time:1207446ms step_avg:230.65ms step:5236/7050 train_time:1207687ms step_avg:230.65ms step:5237/7050 train_time:1207926ms step_avg:230.65ms step:5238/7050 train_time:1208166ms step_avg:230.65ms step:5239/7050 train_time:1208405ms step_avg:230.66ms step:5240/7050 train_time:1208646ms step_avg:230.66ms step:5241/7050 train_time:1208887ms step_avg:230.66ms step:5242/7050 train_time:1209125ms step_avg:230.66ms step:5243/7050 train_time:1209366ms step_avg:230.66ms step:5244/7050 train_time:1209605ms step_avg:230.66ms step:5245/7050 train_time:1209845ms step_avg:230.67ms step:5246/7050 train_time:1210085ms step_avg:230.67ms step:5247/7050 train_time:1210328ms step_avg:230.67ms step:5248/7050 train_time:1210567ms step_avg:230.67ms step:5249/7050 train_time:1210808ms step_avg:230.67ms step:5250/7050 train_time:1211047ms step_avg:230.68ms step:5250/7050 val_loss:3.0269 train_time:1211238ms step_avg:230.71ms step:5251/7050 train_time:1211290ms step_avg:230.68ms step:5252/7050 
train_time:1211530ms step_avg:230.68ms step:5253/7050 train_time:1211772ms step_avg:230.68ms step:5254/7050 train_time:1212011ms step_avg:230.68ms step:5255/7050 train_time:1212254ms step_avg:230.69ms step:5256/7050 train_time:1212494ms step_avg:230.69ms step:5257/7050 train_time:1212736ms step_avg:230.69ms step:5258/7050 train_time:1212976ms step_avg:230.69ms step:5259/7050 train_time:1213215ms step_avg:230.69ms step:5260/7050 train_time:1213457ms step_avg:230.70ms step:5261/7050 train_time:1213698ms step_avg:230.70ms step:5262/7050 train_time:1213939ms step_avg:230.70ms step:5263/7050 train_time:1214179ms step_avg:230.70ms step:5264/7050 train_time:1214420ms step_avg:230.70ms step:5265/7050 train_time:1214660ms step_avg:230.70ms step:5266/7050 train_time:1214901ms step_avg:230.71ms step:5267/7050 train_time:1215140ms step_avg:230.71ms step:5268/7050 train_time:1215380ms step_avg:230.71ms step:5269/7050 train_time:1215620ms step_avg:230.71ms step:5270/7050 train_time:1215863ms step_avg:230.71ms step:5271/7050 train_time:1216102ms step_avg:230.72ms step:5272/7050 train_time:1216342ms step_avg:230.72ms step:5273/7050 train_time:1216584ms step_avg:230.72ms step:5274/7050 train_time:1216825ms step_avg:230.72ms step:5275/7050 train_time:1217065ms step_avg:230.72ms step:5276/7050 train_time:1217304ms step_avg:230.72ms step:5277/7050 train_time:1217544ms step_avg:230.73ms step:5278/7050 train_time:1217785ms step_avg:230.73ms step:5279/7050 train_time:1218025ms step_avg:230.73ms step:5280/7050 train_time:1218269ms step_avg:230.73ms step:5281/7050 train_time:1218509ms step_avg:230.73ms step:5282/7050 train_time:1218749ms step_avg:230.74ms step:5283/7050 train_time:1218989ms step_avg:230.74ms step:5284/7050 train_time:1219229ms step_avg:230.74ms step:5285/7050 train_time:1219469ms step_avg:230.74ms step:5286/7050 train_time:1219710ms step_avg:230.74ms step:5287/7050 train_time:1219952ms step_avg:230.75ms step:5288/7050 train_time:1220193ms step_avg:230.75ms step:5289/7050 
train_time:1220433ms step_avg:230.75ms step:5290/7050 train_time:1220674ms step_avg:230.75ms step:5291/7050 train_time:1220915ms step_avg:230.75ms step:5292/7050 train_time:1221155ms step_avg:230.75ms step:5293/7050 train_time:1221395ms step_avg:230.76ms step:5294/7050 train_time:1221641ms step_avg:230.76ms step:5295/7050 train_time:1221882ms step_avg:230.76ms step:5296/7050 train_time:1222124ms step_avg:230.76ms step:5297/7050 train_time:1222365ms step_avg:230.77ms step:5298/7050 train_time:1222606ms step_avg:230.77ms step:5299/7050 train_time:1222846ms step_avg:230.77ms step:5300/7050 train_time:1223086ms step_avg:230.77ms step:5301/7050 train_time:1223326ms step_avg:230.77ms step:5302/7050 train_time:1223568ms step_avg:230.77ms step:5303/7050 train_time:1223807ms step_avg:230.78ms step:5304/7050 train_time:1224046ms step_avg:230.78ms step:5305/7050 train_time:1224285ms step_avg:230.78ms step:5306/7050 train_time:1224524ms step_avg:230.78ms step:5307/7050 train_time:1224767ms step_avg:230.78ms step:5308/7050 train_time:1225007ms step_avg:230.79ms step:5309/7050 train_time:1225249ms step_avg:230.79ms step:5310/7050 train_time:1225489ms step_avg:230.79ms step:5311/7050 train_time:1225728ms step_avg:230.79ms step:5312/7050 train_time:1225966ms step_avg:230.79ms step:5313/7050 train_time:1226210ms step_avg:230.79ms step:5314/7050 train_time:1226451ms step_avg:230.80ms step:5315/7050 train_time:1226691ms step_avg:230.80ms step:5316/7050 train_time:1226932ms step_avg:230.80ms step:5317/7050 train_time:1227171ms step_avg:230.80ms step:5318/7050 train_time:1227412ms step_avg:230.80ms step:5319/7050 train_time:1227651ms step_avg:230.80ms step:5320/7050 train_time:1227893ms step_avg:230.81ms step:5321/7050 train_time:1228133ms step_avg:230.81ms step:5322/7050 train_time:1228373ms step_avg:230.81ms step:5323/7050 train_time:1228615ms step_avg:230.81ms step:5324/7050 train_time:1228858ms step_avg:230.81ms step:5325/7050 train_time:1229099ms step_avg:230.82ms step:5326/7050 
train_time:1229339ms step_avg:230.82ms step:5327/7050 train_time:1229579ms step_avg:230.82ms step:5328/7050 train_time:1229820ms step_avg:230.82ms step:5329/7050 train_time:1230062ms step_avg:230.82ms step:5330/7050 train_time:1230302ms step_avg:230.83ms step:5331/7050 train_time:1230543ms step_avg:230.83ms step:5332/7050 train_time:1230782ms step_avg:230.83ms step:5333/7050 train_time:1231025ms step_avg:230.83ms step:5334/7050 train_time:1231268ms step_avg:230.83ms step:5335/7050 train_time:1231509ms step_avg:230.84ms step:5336/7050 train_time:1231748ms step_avg:230.84ms step:5337/7050 train_time:1231989ms step_avg:230.84ms step:5338/7050 train_time:1232229ms step_avg:230.84ms step:5339/7050 train_time:1232468ms step_avg:230.84ms step:5340/7050 train_time:1232707ms step_avg:230.84ms step:5341/7050 train_time:1232946ms step_avg:230.85ms step:5342/7050 train_time:1233186ms step_avg:230.85ms step:5343/7050 train_time:1233427ms step_avg:230.85ms step:5344/7050 train_time:1233667ms step_avg:230.85ms step:5345/7050 train_time:1233907ms step_avg:230.85ms step:5346/7050 train_time:1234149ms step_avg:230.85ms step:5347/7050 train_time:1234389ms step_avg:230.86ms step:5348/7050 train_time:1234628ms step_avg:230.86ms step:5349/7050 train_time:1234871ms step_avg:230.86ms step:5350/7050 train_time:1235112ms step_avg:230.86ms step:5351/7050 train_time:1235353ms step_avg:230.86ms step:5352/7050 train_time:1235592ms step_avg:230.87ms step:5353/7050 train_time:1235833ms step_avg:230.87ms step:5354/7050 train_time:1236074ms step_avg:230.87ms step:5355/7050 train_time:1236315ms step_avg:230.87ms step:5356/7050 train_time:1236557ms step_avg:230.87ms step:5357/7050 train_time:1236796ms step_avg:230.87ms step:5358/7050 train_time:1237037ms step_avg:230.88ms step:5359/7050 train_time:1237276ms step_avg:230.88ms step:5360/7050 train_time:1237518ms step_avg:230.88ms step:5361/7050 train_time:1237759ms step_avg:230.88ms step:5362/7050 train_time:1237998ms step_avg:230.88ms step:5363/7050 
train_time:1238239ms step_avg:230.89ms step:5364/7050 train_time:1238479ms step_avg:230.89ms step:5365/7050 train_time:1238723ms step_avg:230.89ms step:5366/7050 train_time:1238964ms step_avg:230.89ms step:5367/7050 train_time:1239204ms step_avg:230.89ms step:5368/7050 train_time:1239447ms step_avg:230.90ms step:5369/7050 train_time:1239688ms step_avg:230.90ms step:5370/7050 train_time:1239929ms step_avg:230.90ms step:5371/7050 train_time:1240168ms step_avg:230.90ms step:5372/7050 train_time:1240408ms step_avg:230.90ms step:5373/7050 train_time:1240651ms step_avg:230.90ms step:5374/7050 train_time:1240893ms step_avg:230.91ms step:5375/7050 train_time:1241132ms step_avg:230.91ms step:5375/7050 val_loss:3.0188 train_time:1241322ms step_avg:230.94ms step:5376/7050 train_time:1241373ms step_avg:230.91ms step:5377/7050 train_time:1241617ms step_avg:230.91ms step:5378/7050 train_time:1241862ms step_avg:230.92ms step:5379/7050 train_time:1242102ms step_avg:230.92ms step:5380/7050 train_time:1242338ms step_avg:230.92ms step:5381/7050 train_time:1242578ms step_avg:230.92ms step:5382/7050 train_time:1242825ms step_avg:230.92ms step:5383/7050 train_time:1243065ms step_avg:230.92ms step:5384/7050 train_time:1243304ms step_avg:230.93ms step:5385/7050 train_time:1243543ms step_avg:230.93ms step:5386/7050 train_time:1243784ms step_avg:230.93ms step:5387/7050 train_time:1244025ms step_avg:230.93ms step:5388/7050 train_time:1244266ms step_avg:230.93ms step:5389/7050 train_time:1244508ms step_avg:230.93ms step:5390/7050 train_time:1244745ms step_avg:230.94ms step:5391/7050 train_time:1244986ms step_avg:230.94ms step:5392/7050 train_time:1245226ms step_avg:230.94ms step:5393/7050 train_time:1245466ms step_avg:230.94ms step:5394/7050 train_time:1245706ms step_avg:230.94ms step:5395/7050 train_time:1245947ms step_avg:230.94ms step:5396/7050 train_time:1246189ms step_avg:230.95ms step:5397/7050 train_time:1246431ms step_avg:230.95ms step:5398/7050 train_time:1246672ms step_avg:230.95ms 
step:5399/7050 train_time:1246915ms step_avg:230.95ms step:5400/7050 train_time:1247155ms step_avg:230.95ms step:5401/7050 train_time:1247395ms step_avg:230.96ms step:5402/7050 train_time:1247636ms step_avg:230.96ms step:5403/7050 train_time:1247878ms step_avg:230.96ms step:5404/7050 train_time:1248120ms step_avg:230.96ms step:5405/7050 train_time:1248358ms step_avg:230.96ms step:5406/7050 train_time:1248599ms step_avg:230.97ms step:5407/7050 train_time:1248838ms step_avg:230.97ms step:5408/7050 train_time:1249079ms step_avg:230.97ms step:5409/7050 train_time:1249320ms step_avg:230.97ms step:5410/7050 train_time:1249559ms step_avg:230.97ms step:5411/7050 train_time:1249801ms step_avg:230.97ms step:5412/7050 train_time:1250042ms step_avg:230.98ms step:5413/7050 train_time:1250285ms step_avg:230.98ms step:5414/7050 train_time:1250523ms step_avg:230.98ms step:5415/7050 train_time:1250765ms step_avg:230.98ms step:5416/7050 train_time:1251005ms step_avg:230.98ms step:5417/7050 train_time:1251245ms step_avg:230.98ms step:5418/7050 train_time:1251483ms step_avg:230.99ms step:5419/7050 train_time:1251724ms step_avg:230.99ms step:5420/7050 train_time:1251964ms step_avg:230.99ms step:5421/7050 train_time:1252203ms step_avg:230.99ms step:5422/7050 train_time:1252444ms step_avg:230.99ms step:5423/7050 train_time:1252686ms step_avg:230.99ms step:5424/7050 train_time:1252931ms step_avg:231.00ms step:5425/7050 train_time:1253175ms step_avg:231.00ms step:5426/7050 train_time:1253417ms step_avg:231.00ms step:5427/7050 train_time:1253656ms step_avg:231.00ms step:5428/7050 train_time:1253897ms step_avg:231.01ms step:5429/7050 train_time:1254137ms step_avg:231.01ms step:5430/7050 train_time:1254376ms step_avg:231.01ms step:5431/7050 train_time:1254615ms step_avg:231.01ms step:5432/7050 train_time:1254856ms step_avg:231.01ms step:5433/7050 train_time:1255096ms step_avg:231.01ms step:5434/7050 train_time:1255338ms step_avg:231.02ms step:5435/7050 train_time:1255579ms step_avg:231.02ms 
step:5436/7050 train_time:1255819ms step_avg:231.02ms step:5437/7050 train_time:1256058ms step_avg:231.02ms step:5438/7050 train_time:1256302ms step_avg:231.02ms step:5439/7050 train_time:1256545ms step_avg:231.03ms step:5440/7050 train_time:1256784ms step_avg:231.03ms step:5441/7050 train_time:1257024ms step_avg:231.03ms step:5442/7050 train_time:1257263ms step_avg:231.03ms step:5443/7050 train_time:1257503ms step_avg:231.03ms step:5444/7050 train_time:1257743ms step_avg:231.03ms step:5445/7050 train_time:1257980ms step_avg:231.03ms step:5446/7050 train_time:1258221ms step_avg:231.04ms step:5447/7050 train_time:1258460ms step_avg:231.04ms step:5448/7050 train_time:1258700ms step_avg:231.04ms step:5449/7050 train_time:1258941ms step_avg:231.04ms step:5450/7050 train_time:1259180ms step_avg:231.04ms step:5451/7050 train_time:1259421ms step_avg:231.04ms step:5452/7050 train_time:1259662ms step_avg:231.05ms step:5453/7050 train_time:1259905ms step_avg:231.05ms step:5454/7050 train_time:1260145ms step_avg:231.05ms step:5455/7050 train_time:1260384ms step_avg:231.05ms step:5456/7050 train_time:1260625ms step_avg:231.05ms step:5457/7050 train_time:1260866ms step_avg:231.05ms step:5458/7050 train_time:1261106ms step_avg:231.06ms step:5459/7050 train_time:1261348ms step_avg:231.06ms step:5460/7050 train_time:1261588ms step_avg:231.06ms step:5461/7050 train_time:1261830ms step_avg:231.06ms step:5462/7050 train_time:1262070ms step_avg:231.06ms step:5463/7050 train_time:1262312ms step_avg:231.07ms step:5464/7050 train_time:1262555ms step_avg:231.07ms step:5465/7050 train_time:1262794ms step_avg:231.07ms step:5466/7050 train_time:1263035ms step_avg:231.07ms step:5467/7050 train_time:1263275ms step_avg:231.07ms step:5468/7050 train_time:1263516ms step_avg:231.07ms step:5469/7050 train_time:1263758ms step_avg:231.08ms step:5470/7050 train_time:1263997ms step_avg:231.08ms step:5471/7050 train_time:1264237ms step_avg:231.08ms step:5472/7050 train_time:1264478ms step_avg:231.08ms 
step:5473/7050 train_time:1264720ms step_avg:231.08ms step:5474/7050 train_time:1264961ms step_avg:231.09ms step:5475/7050 train_time:1265204ms step_avg:231.09ms step:5476/7050 train_time:1265443ms step_avg:231.09ms step:5477/7050 train_time:1265683ms step_avg:231.09ms step:5478/7050 train_time:1265924ms step_avg:231.09ms step:5479/7050 train_time:1266162ms step_avg:231.09ms step:5480/7050 train_time:1266405ms step_avg:231.10ms step:5481/7050 train_time:1266646ms step_avg:231.10ms step:5482/7050 train_time:1266889ms step_avg:231.10ms step:5483/7050 train_time:1267130ms step_avg:231.10ms step:5484/7050 train_time:1267374ms step_avg:231.10ms step:5485/7050 train_time:1267613ms step_avg:231.11ms step:5486/7050 train_time:1267854ms step_avg:231.11ms step:5487/7050 train_time:1268096ms step_avg:231.11ms step:5488/7050 train_time:1268336ms step_avg:231.11ms step:5489/7050 train_time:1268575ms step_avg:231.11ms step:5490/7050 train_time:1268814ms step_avg:231.11ms step:5491/7050 train_time:1269056ms step_avg:231.12ms step:5492/7050 train_time:1269298ms step_avg:231.12ms step:5493/7050 train_time:1269539ms step_avg:231.12ms step:5494/7050 train_time:1269778ms step_avg:231.12ms step:5495/7050 train_time:1270020ms step_avg:231.12ms step:5496/7050 train_time:1270258ms step_avg:231.12ms step:5497/7050 train_time:1270497ms step_avg:231.13ms step:5498/7050 train_time:1270739ms step_avg:231.13ms step:5499/7050 train_time:1270979ms step_avg:231.13ms step:5500/7050 train_time:1271219ms step_avg:231.13ms step:5500/7050 val_loss:3.0110 train_time:1271409ms step_avg:231.17ms step:5501/7050 train_time:1271461ms step_avg:231.13ms step:5502/7050 train_time:1271705ms step_avg:231.13ms step:5503/7050 train_time:1271946ms step_avg:231.14ms step:5504/7050 train_time:1272190ms step_avg:231.14ms step:5505/7050 train_time:1272428ms step_avg:231.14ms step:5506/7050 train_time:1272667ms step_avg:231.14ms step:5507/7050 train_time:1272910ms step_avg:231.14ms step:5508/7050 train_time:1273152ms 
step_avg:231.15ms step:5509/7050 train_time:1273391ms step_avg:231.15ms step:5510/7050 train_time:1273632ms step_avg:231.15ms step:5511/7050 train_time:1273872ms step_avg:231.15ms step:5512/7050 train_time:1274113ms step_avg:231.15ms step:5513/7050 train_time:1274356ms step_avg:231.15ms step:5514/7050 train_time:1274595ms step_avg:231.16ms step:5515/7050 train_time:1274835ms step_avg:231.16ms step:5516/7050 train_time:1275075ms step_avg:231.16ms step:5517/7050 train_time:1275316ms step_avg:231.16ms step:5518/7050 train_time:1275557ms step_avg:231.16ms step:5519/7050 train_time:1275799ms step_avg:231.16ms step:5520/7050 train_time:1276042ms step_avg:231.17ms step:5521/7050 train_time:1276282ms step_avg:231.17ms step:5522/7050 train_time:1276524ms step_avg:231.17ms step:5523/7050 train_time:1276764ms step_avg:231.17ms step:5524/7050 train_time:1277006ms step_avg:231.17ms step:5525/7050 train_time:1277252ms step_avg:231.18ms step:5526/7050 train_time:1277492ms step_avg:231.18ms step:5527/7050 train_time:1277732ms step_avg:231.18ms step:5528/7050 train_time:1277973ms step_avg:231.18ms step:5529/7050 train_time:1278212ms step_avg:231.18ms step:5530/7050 train_time:1278454ms step_avg:231.19ms step:5531/7050 train_time:1278696ms step_avg:231.19ms step:5532/7050 train_time:1278936ms step_avg:231.19ms step:5533/7050 train_time:1279178ms step_avg:231.19ms step:5534/7050 train_time:1279418ms step_avg:231.19ms step:5535/7050 train_time:1279657ms step_avg:231.19ms step:5536/7050 train_time:1279896ms step_avg:231.20ms step:5537/7050 train_time:1280135ms step_avg:231.20ms step:5538/7050 train_time:1280375ms step_avg:231.20ms step:5539/7050 train_time:1280617ms step_avg:231.20ms step:5540/7050 train_time:1280858ms step_avg:231.20ms step:5541/7050 train_time:1281097ms step_avg:231.20ms step:5542/7050 train_time:1281338ms step_avg:231.21ms step:5543/7050 train_time:1281582ms step_avg:231.21ms step:5544/7050 train_time:1281824ms step_avg:231.21ms step:5545/7050 train_time:1282064ms 
step_avg:231.21ms step:5546/7050 train_time:1282303ms step_avg:231.21ms step:5547/7050 train_time:1282543ms step_avg:231.21ms step:5548/7050 train_time:1282785ms step_avg:231.22ms step:5549/7050 train_time:1283032ms step_avg:231.22ms step:5550/7050 train_time:1283274ms step_avg:231.22ms step:5551/7050 train_time:1283512ms step_avg:231.22ms step:5552/7050 train_time:1283754ms step_avg:231.22ms step:5553/7050 train_time:1283992ms step_avg:231.22ms step:5554/7050 train_time:1284233ms step_avg:231.23ms step:5555/7050 train_time:1284476ms step_avg:231.23ms step:5556/7050 train_time:1284714ms step_avg:231.23ms step:5557/7050 train_time:1284954ms step_avg:231.23ms step:5558/7050 train_time:1285195ms step_avg:231.23ms step:5559/7050 train_time:1285435ms step_avg:231.23ms step:5560/7050 train_time:1285673ms step_avg:231.24ms step:5561/7050 train_time:1285913ms step_avg:231.24ms step:5562/7050 train_time:1286155ms step_avg:231.24ms step:5563/7050 train_time:1286396ms step_avg:231.24ms step:5564/7050 train_time:1286636ms step_avg:231.24ms step:5565/7050 train_time:1286876ms step_avg:231.24ms step:5566/7050 train_time:1287122ms step_avg:231.25ms step:5567/7050 train_time:1287362ms step_avg:231.25ms step:5568/7050 train_time:1287602ms step_avg:231.25ms step:5569/7050 train_time:1287843ms step_avg:231.25ms step:5570/7050 train_time:1288084ms step_avg:231.25ms step:5571/7050 train_time:1288325ms step_avg:231.26ms step:5572/7050 train_time:1288565ms step_avg:231.26ms step:5573/7050 train_time:1288810ms step_avg:231.26ms step:5574/7050 train_time:1289056ms step_avg:231.26ms step:5575/7050 train_time:1289294ms step_avg:231.26ms step:5576/7050 train_time:1289533ms step_avg:231.26ms step:5577/7050 train_time:1289773ms step_avg:231.27ms step:5578/7050 train_time:1290016ms step_avg:231.27ms step:5579/7050 train_time:1290256ms step_avg:231.27ms step:5580/7050 train_time:1290497ms step_avg:231.27ms step:5581/7050 train_time:1290738ms step_avg:231.27ms step:5582/7050 train_time:1290979ms 
step_avg:231.28ms step:5583/7050 train_time:1291218ms step_avg:231.28ms step:5584/7050 train_time:1291458ms step_avg:231.28ms step:5585/7050 train_time:1291698ms step_avg:231.28ms step:5586/7050 train_time:1291937ms step_avg:231.28ms step:5587/7050 train_time:1292179ms step_avg:231.28ms step:5588/7050 train_time:1292422ms step_avg:231.29ms step:5589/7050 train_time:1292665ms step_avg:231.29ms step:5590/7050 train_time:1292904ms step_avg:231.29ms step:5591/7050 train_time:1293145ms step_avg:231.29ms step:5592/7050 train_time:1293386ms step_avg:231.29ms step:5593/7050 train_time:1293625ms step_avg:231.29ms step:5594/7050 train_time:1293869ms step_avg:231.30ms step:5595/7050 train_time:1294108ms step_avg:231.30ms step:5596/7050 train_time:1294349ms step_avg:231.30ms step:5597/7050 train_time:1294590ms step_avg:231.30ms step:5598/7050 train_time:1294828ms step_avg:231.30ms step:5599/7050 train_time:1295071ms step_avg:231.30ms step:5600/7050 train_time:1295310ms step_avg:231.31ms step:5601/7050 train_time:1295549ms step_avg:231.31ms step:5602/7050 train_time:1295791ms step_avg:231.31ms step:5603/7050 train_time:1296030ms step_avg:231.31ms step:5604/7050 train_time:1296271ms step_avg:231.31ms step:5605/7050 train_time:1296510ms step_avg:231.31ms step:5606/7050 train_time:1296751ms step_avg:231.31ms step:5607/7050 train_time:1296992ms step_avg:231.32ms step:5608/7050 train_time:1297233ms step_avg:231.32ms step:5609/7050 train_time:1297473ms step_avg:231.32ms step:5610/7050 train_time:1297714ms step_avg:231.32ms step:5611/7050 train_time:1297956ms step_avg:231.32ms step:5612/7050 train_time:1298194ms step_avg:231.32ms step:5613/7050 train_time:1298435ms step_avg:231.33ms step:5614/7050 train_time:1298674ms step_avg:231.33ms step:5615/7050 train_time:1298916ms step_avg:231.33ms step:5616/7050 train_time:1299158ms step_avg:231.33ms step:5617/7050 train_time:1299403ms step_avg:231.33ms step:5618/7050 train_time:1299642ms step_avg:231.34ms step:5619/7050 train_time:1299888ms 
step_avg:231.34ms step:5620/7050 train_time:1300128ms step_avg:231.34ms step:5621/7050 train_time:1300369ms step_avg:231.34ms step:5622/7050 train_time:1300608ms step_avg:231.34ms step:5623/7050 train_time:1300849ms step_avg:231.34ms step:5624/7050 train_time:1301089ms step_avg:231.35ms step:5625/7050 train_time:1301329ms step_avg:231.35ms step:5625/7050 val_loss:3.0027 train_time:1301518ms step_avg:231.38ms step:5626/7050 train_time:1301570ms step_avg:231.35ms step:5627/7050 train_time:1301807ms step_avg:231.35ms step:5628/7050 train_time:1302050ms step_avg:231.35ms step:5629/7050 train_time:1302291ms step_avg:231.35ms step:5630/7050 train_time:1302530ms step_avg:231.36ms step:5631/7050 train_time:1302770ms step_avg:231.36ms step:5632/7050 train_time:1303011ms step_avg:231.36ms step:5633/7050 train_time:1303252ms step_avg:231.36ms step:5634/7050 train_time:1303493ms step_avg:231.36ms step:5635/7050 train_time:1303733ms step_avg:231.36ms step:5636/7050 train_time:1303973ms step_avg:231.36ms step:5637/7050 train_time:1304212ms step_avg:231.37ms step:5638/7050 train_time:1304451ms step_avg:231.37ms step:5639/7050 train_time:1304693ms step_avg:231.37ms step:5640/7050 train_time:1304934ms step_avg:231.37ms step:5641/7050 train_time:1305174ms step_avg:231.37ms step:5642/7050 train_time:1305415ms step_avg:231.37ms step:5643/7050 train_time:1305655ms step_avg:231.38ms step:5644/7050 train_time:1305899ms step_avg:231.38ms step:5645/7050 train_time:1306141ms step_avg:231.38ms step:5646/7050 train_time:1306379ms step_avg:231.38ms step:5647/7050 train_time:1306619ms step_avg:231.38ms step:5648/7050 train_time:1306858ms step_avg:231.38ms step:5649/7050 train_time:1307099ms step_avg:231.39ms step:5650/7050 train_time:1307339ms step_avg:231.39ms step:5651/7050 train_time:1307580ms step_avg:231.39ms step:5652/7050 train_time:1307821ms step_avg:231.39ms step:5653/7050 train_time:1308061ms step_avg:231.39ms step:5654/7050 train_time:1308307ms step_avg:231.39ms step:5655/7050 
train_time:1308547ms step_avg:231.40ms step:5656/7050 train_time:1308788ms step_avg:231.40ms step:5657/7050 train_time:1309028ms step_avg:231.40ms step:5658/7050 train_time:1309275ms step_avg:231.40ms step:5659/7050 train_time:1309522ms step_avg:231.41ms step:5660/7050 train_time:1309759ms step_avg:231.41ms step:5661/7050 train_time:1309999ms step_avg:231.41ms step:5662/7050 train_time:1310241ms step_avg:231.41ms step:5663/7050 train_time:1310481ms step_avg:231.41ms step:5664/7050 train_time:1310721ms step_avg:231.41ms step:5665/7050 train_time:1310962ms step_avg:231.41ms step:5666/7050 train_time:1311204ms step_avg:231.42ms step:5667/7050 train_time:1311445ms step_avg:231.42ms step:5668/7050 train_time:1311685ms step_avg:231.42ms step:5669/7050 train_time:1311923ms step_avg:231.42ms step:5670/7050 train_time:1312164ms step_avg:231.42ms step:5671/7050 train_time:1312406ms step_avg:231.42ms step:5672/7050 train_time:1312650ms step_avg:231.43ms step:5673/7050 train_time:1312890ms step_avg:231.43ms step:5674/7050 train_time:1313132ms step_avg:231.43ms step:5675/7050 train_time:1313371ms step_avg:231.43ms step:5676/7050 train_time:1313612ms step_avg:231.43ms step:5677/7050 train_time:1313851ms step_avg:231.43ms step:5678/7050 train_time:1314092ms step_avg:231.44ms step:5679/7050 train_time:1314333ms step_avg:231.44ms step:5680/7050 train_time:1314572ms step_avg:231.44ms step:5681/7050 train_time:1314812ms step_avg:231.44ms step:5682/7050 train_time:1315051ms step_avg:231.44ms step:5683/7050 train_time:1315295ms step_avg:231.44ms step:5684/7050 train_time:1315534ms step_avg:231.45ms step:5685/7050 train_time:1315774ms step_avg:231.45ms step:5686/7050 train_time:1316015ms step_avg:231.45ms step:5687/7050 train_time:1316257ms step_avg:231.45ms step:5688/7050 train_time:1316497ms step_avg:231.45ms step:5689/7050 train_time:1316738ms step_avg:231.45ms step:5690/7050 train_time:1316978ms step_avg:231.45ms step:5691/7050 train_time:1317216ms step_avg:231.46ms step:5692/7050 
train_time:1317457ms step_avg:231.46ms step:5693/7050 train_time:1317697ms step_avg:231.46ms step:5694/7050 train_time:1317940ms step_avg:231.46ms step:5695/7050 train_time:1318179ms step_avg:231.46ms step:5696/7050 train_time:1318420ms step_avg:231.46ms step:5697/7050 train_time:1318662ms step_avg:231.47ms step:5698/7050 train_time:1318902ms step_avg:231.47ms step:5699/7050 train_time:1319141ms step_avg:231.47ms step:5700/7050 train_time:1319384ms step_avg:231.47ms step:5701/7050 train_time:1319624ms step_avg:231.47ms step:5702/7050 train_time:1319868ms step_avg:231.47ms step:5703/7050 train_time:1320111ms step_avg:231.48ms step:5704/7050 train_time:1320350ms step_avg:231.48ms step:5705/7050 train_time:1320589ms step_avg:231.48ms step:5706/7050 train_time:1320832ms step_avg:231.48ms step:5707/7050 train_time:1321075ms step_avg:231.48ms step:5708/7050 train_time:1321316ms step_avg:231.48ms step:5709/7050 train_time:1321555ms step_avg:231.49ms step:5710/7050 train_time:1321795ms step_avg:231.49ms step:5711/7050 train_time:1322038ms step_avg:231.49ms step:5712/7050 train_time:1322279ms step_avg:231.49ms step:5713/7050 train_time:1322521ms step_avg:231.49ms step:5714/7050 train_time:1322760ms step_avg:231.49ms step:5715/7050 train_time:1323000ms step_avg:231.50ms step:5716/7050 train_time:1323241ms step_avg:231.50ms step:5717/7050 train_time:1323484ms step_avg:231.50ms step:5718/7050 train_time:1323723ms step_avg:231.50ms step:5719/7050 train_time:1323964ms step_avg:231.50ms step:5720/7050 train_time:1324205ms step_avg:231.50ms step:5721/7050 train_time:1324447ms step_avg:231.51ms step:5722/7050 train_time:1324687ms step_avg:231.51ms step:5723/7050 train_time:1324928ms step_avg:231.51ms step:5724/7050 train_time:1325172ms step_avg:231.51ms step:5725/7050 train_time:1325417ms step_avg:231.51ms step:5726/7050 train_time:1325657ms step_avg:231.52ms step:5727/7050 train_time:1325897ms step_avg:231.52ms step:5728/7050 train_time:1326137ms step_avg:231.52ms step:5729/7050 
train_time:1326376ms step_avg:231.52ms step:5730/7050 train_time:1326617ms step_avg:231.52ms step:5731/7050 train_time:1326857ms step_avg:231.52ms step:5732/7050 train_time:1327098ms step_avg:231.52ms step:5733/7050 train_time:1327337ms step_avg:231.53ms step:5734/7050 train_time:1327577ms step_avg:231.53ms step:5735/7050 train_time:1327818ms step_avg:231.53ms step:5736/7050 train_time:1328057ms step_avg:231.53ms step:5737/7050 train_time:1328299ms step_avg:231.53ms step:5738/7050 train_time:1328538ms step_avg:231.53ms step:5739/7050 train_time:1328778ms step_avg:231.53ms step:5740/7050 train_time:1329021ms step_avg:231.54ms step:5741/7050 train_time:1329263ms step_avg:231.54ms step:5742/7050 train_time:1329507ms step_avg:231.54ms step:5743/7050 train_time:1329745ms step_avg:231.54ms step:5744/7050 train_time:1329986ms step_avg:231.54ms step:5745/7050 train_time:1330225ms step_avg:231.54ms step:5746/7050 train_time:1330468ms step_avg:231.55ms step:5747/7050 train_time:1330710ms step_avg:231.55ms step:5748/7050 train_time:1330953ms step_avg:231.55ms step:5749/7050 train_time:1331200ms step_avg:231.55ms step:5750/7050 train_time:1331444ms step_avg:231.56ms step:5750/7050 val_loss:2.9930 train_time:1331637ms step_avg:231.59ms step:5751/7050 train_time:1331688ms step_avg:231.56ms step:5752/7050 train_time:1331932ms step_avg:231.56ms step:5753/7050 train_time:1332177ms step_avg:231.56ms step:5754/7050 train_time:1332419ms step_avg:231.56ms step:5755/7050 train_time:1332661ms step_avg:231.57ms step:5756/7050 train_time:1332904ms step_avg:231.57ms step:5757/7050 train_time:1333147ms step_avg:231.57ms step:5758/7050 train_time:1333394ms step_avg:231.57ms step:5759/7050 train_time:1333636ms step_avg:231.57ms step:5760/7050 train_time:1333883ms step_avg:231.58ms step:5761/7050 train_time:1334126ms step_avg:231.58ms step:5762/7050 train_time:1334370ms step_avg:231.58ms step:5763/7050 train_time:1334612ms step_avg:231.58ms step:5764/7050 train_time:1334854ms step_avg:231.58ms 
step:5765/7050 train_time:1335097ms step_avg:231.59ms step:5766/7050 train_time:1335345ms step_avg:231.59ms step:5767/7050 train_time:1335586ms step_avg:231.59ms step:5768/7050 train_time:1335831ms step_avg:231.59ms step:5769/7050 train_time:1336073ms step_avg:231.60ms step:5770/7050 train_time:1336317ms step_avg:231.60ms step:5771/7050 train_time:1336560ms step_avg:231.60ms step:5772/7050 train_time:1336804ms step_avg:231.60ms step:5773/7050 train_time:1337048ms step_avg:231.60ms step:5774/7050 train_time:1337290ms step_avg:231.61ms step:5775/7050 train_time:1337532ms step_avg:231.61ms step:5776/7050 train_time:1337776ms step_avg:231.61ms step:5777/7050 train_time:1338021ms step_avg:231.61ms step:5778/7050 train_time:1338263ms step_avg:231.61ms step:5779/7050 train_time:1338504ms step_avg:231.62ms step:5780/7050 train_time:1338751ms step_avg:231.62ms step:5781/7050 train_time:1338993ms step_avg:231.62ms step:5782/7050 train_time:1339236ms step_avg:231.62ms step:5783/7050 train_time:1339478ms step_avg:231.62ms step:5784/7050 train_time:1339723ms step_avg:231.63ms step:5785/7050 train_time:1339967ms step_avg:231.63ms step:5786/7050 train_time:1340209ms step_avg:231.63ms step:5787/7050 train_time:1340453ms step_avg:231.63ms step:5788/7050 train_time:1340697ms step_avg:231.63ms step:5789/7050 train_time:1340939ms step_avg:231.64ms step:5790/7050 train_time:1341181ms step_avg:231.64ms step:5791/7050 train_time:1341422ms step_avg:231.64ms step:5792/7050 train_time:1341666ms step_avg:231.64ms step:5793/7050 train_time:1341908ms step_avg:231.64ms step:5794/7050 train_time:1342150ms step_avg:231.64ms step:5795/7050 train_time:1342391ms step_avg:231.65ms step:5796/7050 train_time:1342639ms step_avg:231.65ms step:5797/7050 train_time:1342883ms step_avg:231.65ms step:5798/7050 train_time:1343134ms step_avg:231.65ms step:5799/7050 train_time:1343376ms step_avg:231.66ms step:5800/7050 train_time:1343618ms step_avg:231.66ms step:5801/7050 train_time:1343864ms step_avg:231.66ms 
step:5802/7050 train_time:1344106ms step_avg:231.66ms step:5803/7050 train_time:1344354ms step_avg:231.67ms step:5804/7050 train_time:1344593ms step_avg:231.67ms step:5805/7050 train_time:1344834ms step_avg:231.67ms step:5806/7050 train_time:1345079ms step_avg:231.67ms step:5807/7050 train_time:1345321ms step_avg:231.67ms step:5808/7050 train_time:1345565ms step_avg:231.67ms step:5809/7050 train_time:1345809ms step_avg:231.68ms step:5810/7050 train_time:1346051ms step_avg:231.68ms step:5811/7050 train_time:1346294ms step_avg:231.68ms step:5812/7050 train_time:1346538ms step_avg:231.68ms step:5813/7050 train_time:1346779ms step_avg:231.68ms step:5814/7050 train_time:1347022ms step_avg:231.69ms step:5815/7050 train_time:1347269ms step_avg:231.69ms step:5816/7050 train_time:1347518ms step_avg:231.69ms step:5817/7050 train_time:1347759ms step_avg:231.69ms step:5818/7050 train_time:1348002ms step_avg:231.70ms step:5819/7050 train_time:1348249ms step_avg:231.70ms step:5820/7050 train_time:1348494ms step_avg:231.70ms step:5821/7050 train_time:1348739ms step_avg:231.70ms step:5822/7050 train_time:1348983ms step_avg:231.70ms step:5823/7050 train_time:1349230ms step_avg:231.71ms step:5824/7050 train_time:1349473ms step_avg:231.71ms step:5825/7050 train_time:1349718ms step_avg:231.71ms step:5826/7050 train_time:1349961ms step_avg:231.71ms step:5827/7050 train_time:1350204ms step_avg:231.72ms step:5828/7050 train_time:1350450ms step_avg:231.72ms step:5829/7050 train_time:1350695ms step_avg:231.72ms step:5830/7050 train_time:1350937ms step_avg:231.72ms step:5831/7050 train_time:1351178ms step_avg:231.72ms step:5832/7050 train_time:1351420ms step_avg:231.72ms step:5833/7050 train_time:1351669ms step_avg:231.73ms step:5834/7050 train_time:1351915ms step_avg:231.73ms step:5835/7050 train_time:1352157ms step_avg:231.73ms step:5836/7050 train_time:1352401ms step_avg:231.73ms step:5837/7050 train_time:1352644ms step_avg:231.74ms step:5838/7050 train_time:1352888ms step_avg:231.74ms 
step:5839/7050 train_time:1353131ms step_avg:231.74ms step:5840/7050 train_time:1353373ms step_avg:231.74ms step:5841/7050 train_time:1353617ms step_avg:231.74ms step:5842/7050 train_time:1353865ms step_avg:231.75ms step:5843/7050 train_time:1354109ms step_avg:231.75ms step:5844/7050 train_time:1354351ms step_avg:231.75ms step:5845/7050 train_time:1354596ms step_avg:231.75ms step:5846/7050 train_time:1354846ms step_avg:231.76ms step:5847/7050 train_time:1355087ms step_avg:231.76ms step:5848/7050 train_time:1355337ms step_avg:231.76ms step:5849/7050 train_time:1355579ms step_avg:231.76ms step:5850/7050 train_time:1355823ms step_avg:231.76ms step:5851/7050 train_time:1356071ms step_avg:231.77ms step:5852/7050 train_time:1356316ms step_avg:231.77ms step:5853/7050 train_time:1356556ms step_avg:231.77ms step:5854/7050 train_time:1356799ms step_avg:231.77ms step:5855/7050 train_time:1357040ms step_avg:231.77ms step:5856/7050 train_time:1357283ms step_avg:231.78ms step:5857/7050 train_time:1357526ms step_avg:231.78ms step:5858/7050 train_time:1357766ms step_avg:231.78ms step:5859/7050 train_time:1358013ms step_avg:231.78ms step:5860/7050 train_time:1358255ms step_avg:231.78ms step:5861/7050 train_time:1358504ms step_avg:231.79ms step:5862/7050 train_time:1358744ms step_avg:231.79ms step:5863/7050 train_time:1358989ms step_avg:231.79ms step:5864/7050 train_time:1359235ms step_avg:231.79ms step:5865/7050 train_time:1359481ms step_avg:231.80ms step:5866/7050 train_time:1359723ms step_avg:231.80ms step:5867/7050 train_time:1359967ms step_avg:231.80ms step:5868/7050 train_time:1360209ms step_avg:231.80ms step:5869/7050 train_time:1360452ms step_avg:231.80ms step:5870/7050 train_time:1360696ms step_avg:231.81ms step:5871/7050 train_time:1360939ms step_avg:231.81ms step:5872/7050 train_time:1361186ms step_avg:231.81ms step:5873/7050 train_time:1361430ms step_avg:231.81ms step:5874/7050 train_time:1361671ms step_avg:231.81ms step:5875/7050 train_time:1361913ms step_avg:231.81ms 
step:5875/7050 val_loss:2.9842 train_time:1362108ms step_avg:231.85ms step:5876/7050 train_time:1362161ms step_avg:231.82ms step:5877/7050 train_time:1362404ms step_avg:231.82ms step:5878/7050 train_time:1362650ms step_avg:231.82ms step:5879/7050 train_time:1362894ms step_avg:231.82ms step:5880/7050 train_time:1363137ms step_avg:231.83ms step:5881/7050 train_time:1363380ms step_avg:231.83ms step:5882/7050 train_time:1363628ms step_avg:231.83ms step:5883/7050 train_time:1363869ms step_avg:231.83ms step:5884/7050 train_time:1364112ms step_avg:231.83ms step:5885/7050 train_time:1364355ms step_avg:231.84ms step:5886/7050 train_time:1364599ms step_avg:231.84ms step:5887/7050 train_time:1364846ms step_avg:231.84ms step:5888/7050 train_time:1365090ms step_avg:231.84ms step:5889/7050 train_time:1365328ms step_avg:231.84ms step:5890/7050 train_time:1365571ms step_avg:231.85ms step:5891/7050 train_time:1365815ms step_avg:231.85ms step:5892/7050 train_time:1366059ms step_avg:231.85ms step:5893/7050 train_time:1366301ms step_avg:231.85ms step:5894/7050 train_time:1366543ms step_avg:231.85ms step:5895/7050 train_time:1366786ms step_avg:231.86ms step:5896/7050 train_time:1367032ms step_avg:231.86ms step:5897/7050 train_time:1367273ms step_avg:231.86ms step:5898/7050 train_time:1367514ms step_avg:231.86ms step:5899/7050 train_time:1367757ms step_avg:231.86ms step:5900/7050 train_time:1368004ms step_avg:231.87ms step:5901/7050 train_time:1368245ms step_avg:231.87ms step:5902/7050 train_time:1368486ms step_avg:231.87ms step:5903/7050 train_time:1368727ms step_avg:231.87ms step:5904/7050 train_time:1368970ms step_avg:231.87ms step:5905/7050 train_time:1369212ms step_avg:231.87ms step:5906/7050 train_time:1369455ms step_avg:231.88ms step:5907/7050 train_time:1369697ms step_avg:231.88ms step:5908/7050 train_time:1369943ms step_avg:231.88ms step:5909/7050 train_time:1370191ms step_avg:231.88ms step:5910/7050 train_time:1370432ms step_avg:231.88ms step:5911/7050 train_time:1370674ms 
step_avg:231.89ms step:5912/7050 train_time:1370916ms step_avg:231.89ms step:5913/7050 train_time:1371160ms step_avg:231.89ms step:5914/7050 train_time:1371411ms step_avg:231.89ms step:5915/7050 train_time:1371653ms step_avg:231.89ms step:5916/7050 train_time:1371896ms step_avg:231.90ms step:5917/7050 train_time:1372138ms step_avg:231.90ms step:5918/7050 train_time:1372381ms step_avg:231.90ms step:5919/7050 train_time:1372623ms step_avg:231.90ms step:5920/7050 train_time:1372865ms step_avg:231.90ms step:5921/7050 train_time:1373106ms step_avg:231.90ms step:5922/7050 train_time:1373354ms step_avg:231.91ms step:5923/7050 train_time:1373599ms step_avg:231.91ms step:5924/7050 train_time:1373842ms step_avg:231.91ms step:5925/7050 train_time:1374084ms step_avg:231.91ms step:5926/7050 train_time:1374326ms step_avg:231.91ms step:5927/7050 train_time:1374571ms step_avg:231.92ms step:5928/7050 train_time:1374816ms step_avg:231.92ms step:5929/7050 train_time:1375060ms step_avg:231.92ms step:5930/7050 train_time:1375301ms step_avg:231.92ms step:5931/7050 train_time:1375545ms step_avg:231.92ms step:5932/7050 train_time:1375789ms step_avg:231.93ms step:5933/7050 train_time:1376031ms step_avg:231.93ms step:5934/7050 train_time:1376278ms step_avg:231.93ms step:5935/7050 train_time:1376519ms step_avg:231.93ms step:5936/7050 train_time:1376761ms step_avg:231.93ms step:5937/7050 train_time:1377004ms step_avg:231.94ms step:5938/7050 train_time:1377248ms step_avg:231.94ms step:5939/7050 train_time:1377494ms step_avg:231.94ms step:5940/7050 train_time:1377736ms step_avg:231.94ms step:5941/7050 train_time:1377982ms step_avg:231.94ms step:5942/7050 train_time:1378227ms step_avg:231.95ms step:5943/7050 train_time:1378470ms step_avg:231.95ms step:5944/7050 train_time:1378712ms step_avg:231.95ms step:5945/7050 train_time:1378954ms step_avg:231.95ms step:5946/7050 train_time:1379200ms step_avg:231.95ms step:5947/7050 train_time:1379442ms step_avg:231.96ms step:5948/7050 train_time:1379684ms 
step_avg:231.96ms step:5949/7050 train_time:1379929ms step_avg:231.96ms step:5950/7050 train_time:1380171ms step_avg:231.96ms step:5951/7050 train_time:1380412ms step_avg:231.96ms step:5952/7050 train_time:1380654ms step_avg:231.96ms step:5953/7050 train_time:1380899ms step_avg:231.97ms step:5954/7050 train_time:1381143ms step_avg:231.97ms step:5955/7050 train_time:1381386ms step_avg:231.97ms step:5956/7050 train_time:1381629ms step_avg:231.97ms step:5957/7050 train_time:1381875ms step_avg:231.98ms step:5958/7050 train_time:1382117ms step_avg:231.98ms step:5959/7050 train_time:1382362ms step_avg:231.98ms step:5960/7050 train_time:1382606ms step_avg:231.98ms step:5961/7050 train_time:1382851ms step_avg:231.98ms step:5962/7050 train_time:1383096ms step_avg:231.99ms step:5963/7050 train_time:1383337ms step_avg:231.99ms step:5964/7050 train_time:1383580ms step_avg:231.99ms step:5965/7050 train_time:1383823ms step_avg:231.99ms step:5966/7050 train_time:1384067ms step_avg:231.99ms step:5967/7050 train_time:1384310ms step_avg:231.99ms step:5968/7050 train_time:1384552ms step_avg:232.00ms step:5969/7050 train_time:1384793ms step_avg:232.00ms step:5970/7050 train_time:1385037ms step_avg:232.00ms step:5971/7050 train_time:1385282ms step_avg:232.00ms step:5972/7050 train_time:1385523ms step_avg:232.00ms step:5973/7050 train_time:1385767ms step_avg:232.01ms step:5974/7050 train_time:1386008ms step_avg:232.01ms step:5975/7050 train_time:1386250ms step_avg:232.01ms step:5976/7050 train_time:1386491ms step_avg:232.01ms step:5977/7050 train_time:1386738ms step_avg:232.01ms step:5978/7050 train_time:1386981ms step_avg:232.01ms step:5979/7050 train_time:1387222ms step_avg:232.02ms step:5980/7050 train_time:1387466ms step_avg:232.02ms step:5981/7050 train_time:1387709ms step_avg:232.02ms step:5982/7050 train_time:1387954ms step_avg:232.02ms step:5983/7050 train_time:1388198ms step_avg:232.02ms step:5984/7050 train_time:1388440ms step_avg:232.03ms step:5985/7050 train_time:1388682ms 
step_avg:232.03ms step:5986/7050 train_time:1388925ms step_avg:232.03ms step:5987/7050 train_time:1389169ms step_avg:232.03ms step:5988/7050 train_time:1389417ms step_avg:232.03ms step:5989/7050 train_time:1389664ms step_avg:232.04ms step:5990/7050 train_time:1389914ms step_avg:232.04ms step:5991/7050 train_time:1390154ms step_avg:232.04ms step:5992/7050 train_time:1390397ms step_avg:232.04ms step:5993/7050 train_time:1390638ms step_avg:232.04ms step:5994/7050 train_time:1390887ms step_avg:232.05ms step:5995/7050 train_time:1391129ms step_avg:232.05ms step:5996/7050 train_time:1391370ms step_avg:232.05ms step:5997/7050 train_time:1391611ms step_avg:232.05ms step:5998/7050 train_time:1391854ms step_avg:232.05ms step:5999/7050 train_time:1392096ms step_avg:232.05ms step:6000/7050 train_time:1392340ms step_avg:232.06ms step:6000/7050 val_loss:2.9773 train_time:1392532ms step_avg:232.09ms step:6001/7050 train_time:1392583ms step_avg:232.06ms step:6002/7050 train_time:1392828ms step_avg:232.06ms step:6003/7050 train_time:1393073ms step_avg:232.06ms step:6004/7050 train_time:1393316ms step_avg:232.06ms step:6005/7050 train_time:1393559ms step_avg:232.07ms step:6006/7050 train_time:1393802ms step_avg:232.07ms step:6007/7050 train_time:1394047ms step_avg:232.07ms step:6008/7050 train_time:1394290ms step_avg:232.07ms step:6009/7050 train_time:1394535ms step_avg:232.07ms step:6010/7050 train_time:1394778ms step_avg:232.08ms step:6011/7050 train_time:1395021ms step_avg:232.08ms step:6012/7050 train_time:1395268ms step_avg:232.08ms step:6013/7050 train_time:1395511ms step_avg:232.08ms step:6014/7050 train_time:1395756ms step_avg:232.08ms step:6015/7050 train_time:1396000ms step_avg:232.09ms step:6016/7050 train_time:1396244ms step_avg:232.09ms step:6017/7050 train_time:1396486ms step_avg:232.09ms step:6018/7050 train_time:1396731ms step_avg:232.09ms step:6019/7050 train_time:1396974ms step_avg:232.09ms step:6020/7050 train_time:1397215ms step_avg:232.10ms step:6021/7050 
train_time:1397459ms step_avg:232.10ms step:6022/7050 train_time:1397703ms step_avg:232.10ms step:6023/7050 train_time:1397947ms step_avg:232.10ms step:6024/7050 train_time:1398192ms step_avg:232.10ms step:6025/7050 train_time:1398437ms step_avg:232.11ms step:6026/7050 train_time:1398677ms step_avg:232.11ms step:6027/7050 train_time:1398921ms step_avg:232.11ms step:6028/7050 train_time:1399163ms step_avg:232.11ms step:6029/7050 train_time:1399407ms step_avg:232.11ms step:6030/7050 train_time:1399650ms step_avg:232.11ms step:6031/7050 train_time:1399893ms step_avg:232.12ms step:6032/7050 train_time:1400138ms step_avg:232.12ms step:6033/7050 train_time:1400383ms step_avg:232.12ms step:6034/7050 train_time:1400628ms step_avg:232.12ms step:6035/7050 train_time:1400874ms step_avg:232.12ms step:6036/7050 train_time:1401119ms step_avg:232.13ms step:6037/7050 train_time:1401361ms step_avg:232.13ms step:6038/7050 train_time:1401609ms step_avg:232.13ms step:6039/7050 train_time:1401849ms step_avg:232.13ms step:6040/7050 train_time:1402096ms step_avg:232.14ms step:6041/7050 train_time:1402338ms step_avg:232.14ms step:6042/7050 train_time:1402583ms step_avg:232.14ms step:6043/7050 train_time:1402828ms step_avg:232.14ms step:6044/7050 train_time:1403069ms step_avg:232.14ms step:6045/7050 train_time:1403317ms step_avg:232.15ms step:6046/7050 train_time:1403561ms step_avg:232.15ms step:6047/7050 train_time:1403804ms step_avg:232.15ms step:6048/7050 train_time:1404048ms step_avg:232.15ms step:6049/7050 train_time:1404288ms step_avg:232.15ms step:6050/7050 train_time:1404542ms step_avg:232.16ms step:6051/7050 train_time:1404784ms step_avg:232.16ms step:6052/7050 train_time:1405026ms step_avg:232.16ms step:6053/7050 train_time:1405267ms step_avg:232.16ms step:6054/7050 train_time:1405511ms step_avg:232.16ms step:6055/7050 train_time:1405760ms step_avg:232.17ms step:6056/7050 train_time:1406001ms step_avg:232.17ms step:6057/7050 train_time:1406250ms step_avg:232.17ms step:6058/7050 
train_time:1406495ms step_avg:232.17ms step:6059/7050 train_time:1406741ms step_avg:232.17ms step:6060/7050 train_time:1406983ms step_avg:232.18ms step:6061/7050 train_time:1407226ms step_avg:232.18ms step:6062/7050 train_time:1407467ms step_avg:232.18ms step:6063/7050 train_time:1407709ms step_avg:232.18ms step:6064/7050 train_time:1407949ms step_avg:232.18ms step:6065/7050 train_time:1408193ms step_avg:232.18ms step:6066/7050 train_time:1408444ms step_avg:232.19ms step:6067/7050 train_time:1408686ms step_avg:232.19ms step:6068/7050 train_time:1408932ms step_avg:232.19ms step:6069/7050 train_time:1409172ms step_avg:232.19ms step:6070/7050 train_time:1409420ms step_avg:232.19ms step:6071/7050 train_time:1409662ms step_avg:232.20ms step:6072/7050 train_time:1409907ms step_avg:232.20ms step:6073/7050 train_time:1410148ms step_avg:232.20ms step:6074/7050 train_time:1410391ms step_avg:232.20ms step:6075/7050 train_time:1410639ms step_avg:232.20ms step:6076/7050 train_time:1410880ms step_avg:232.21ms step:6077/7050 train_time:1411121ms step_avg:232.21ms step:6078/7050 train_time:1411366ms step_avg:232.21ms step:6079/7050 train_time:1411609ms step_avg:232.21ms step:6080/7050 train_time:1411854ms step_avg:232.21ms step:6081/7050 train_time:1412097ms step_avg:232.21ms step:6082/7050 train_time:1412340ms step_avg:232.22ms step:6083/7050 train_time:1412590ms step_avg:232.22ms step:6084/7050 train_time:1412833ms step_avg:232.22ms step:6085/7050 train_time:1413074ms step_avg:232.22ms step:6086/7050 train_time:1413315ms step_avg:232.22ms step:6087/7050 train_time:1413560ms step_avg:232.23ms step:6088/7050 train_time:1413802ms step_avg:232.23ms step:6089/7050 train_time:1414047ms step_avg:232.23ms step:6090/7050 train_time:1414290ms step_avg:232.23ms step:6091/7050 train_time:1414536ms step_avg:232.23ms step:6092/7050 train_time:1414778ms step_avg:232.24ms step:6093/7050 train_time:1415020ms step_avg:232.24ms step:6094/7050 train_time:1415262ms step_avg:232.24ms step:6095/7050 
train_time:1415511ms step_avg:232.24ms step:6096/7050 train_time:1415750ms step_avg:232.24ms step:6097/7050 train_time:1415993ms step_avg:232.24ms step:6098/7050 train_time:1416234ms step_avg:232.25ms step:6099/7050 train_time:1416477ms step_avg:232.25ms step:6100/7050 train_time:1416721ms step_avg:232.25ms step:6101/7050 train_time:1416963ms step_avg:232.25ms step:6102/7050 train_time:1417206ms step_avg:232.25ms step:6103/7050 train_time:1417449ms step_avg:232.25ms step:6104/7050 train_time:1417697ms step_avg:232.26ms step:6105/7050 train_time:1417938ms step_avg:232.26ms step:6106/7050 train_time:1418180ms step_avg:232.26ms step:6107/7050 train_time:1418425ms step_avg:232.26ms step:6108/7050 train_time:1418672ms step_avg:232.26ms step:6109/7050 train_time:1418918ms step_avg:232.27ms step:6110/7050 train_time:1419163ms step_avg:232.27ms step:6111/7050 train_time:1419406ms step_avg:232.27ms step:6112/7050 train_time:1419657ms step_avg:232.27ms step:6113/7050 train_time:1419899ms step_avg:232.28ms step:6114/7050 train_time:1420141ms step_avg:232.28ms step:6115/7050 train_time:1420386ms step_avg:232.28ms step:6116/7050 train_time:1420630ms step_avg:232.28ms step:6117/7050 train_time:1420872ms step_avg:232.28ms step:6118/7050 train_time:1421117ms step_avg:232.28ms step:6119/7050 train_time:1421360ms step_avg:232.29ms step:6120/7050 train_time:1421603ms step_avg:232.29ms step:6121/7050 train_time:1421846ms step_avg:232.29ms step:6122/7050 train_time:1422092ms step_avg:232.29ms step:6123/7050 train_time:1422335ms step_avg:232.29ms step:6124/7050 train_time:1422580ms step_avg:232.30ms step:6125/7050 train_time:1422832ms step_avg:232.30ms step:6125/7050 val_loss:2.9686 train_time:1423023ms step_avg:232.33ms step:6126/7050 train_time:1423077ms step_avg:232.30ms step:6127/7050 train_time:1423323ms step_avg:232.30ms step:6128/7050 train_time:1423568ms step_avg:232.31ms step:6129/7050 train_time:1423812ms step_avg:232.31ms step:6130/7050 train_time:1424053ms step_avg:232.31ms 
step:6131/7050 train_time:1424298ms step_avg:232.31ms step:6132/7050 train_time:1424550ms step_avg:232.31ms step:6133/7050 train_time:1424794ms step_avg:232.32ms step:6134/7050 train_time:1425035ms step_avg:232.32ms step:6135/7050 train_time:1425275ms step_avg:232.32ms step:6136/7050 train_time:1425519ms step_avg:232.32ms step:6137/7050 train_time:1425761ms step_avg:232.32ms step:6138/7050 train_time:1426003ms step_avg:232.32ms step:6139/7050 train_time:1426245ms step_avg:232.33ms step:6140/7050 train_time:1426487ms step_avg:232.33ms step:6141/7050 train_time:1426730ms step_avg:232.33ms step:6142/7050 train_time:1426971ms step_avg:232.33ms step:6143/7050 train_time:1427215ms step_avg:232.33ms step:6144/7050 train_time:1427457ms step_avg:232.33ms step:6145/7050 train_time:1427704ms step_avg:232.34ms step:6146/7050 train_time:1427955ms step_avg:232.34ms step:6147/7050 train_time:1428195ms step_avg:232.34ms step:6148/7050 train_time:1428437ms step_avg:232.34ms step:6149/7050 train_time:1428680ms step_avg:232.34ms step:6150/7050 train_time:1428924ms step_avg:232.35ms step:6151/7050 train_time:1429166ms step_avg:232.35ms step:6152/7050 train_time:1429408ms step_avg:232.35ms step:6153/7050 train_time:1429650ms step_avg:232.35ms step:6154/7050 train_time:1429894ms step_avg:232.35ms step:6155/7050 train_time:1430136ms step_avg:232.35ms step:6156/7050 train_time:1430379ms step_avg:232.36ms step:6157/7050 train_time:1430625ms step_avg:232.36ms step:6158/7050 train_time:1430870ms step_avg:232.36ms step:6159/7050 train_time:1431113ms step_avg:232.36ms step:6160/7050 train_time:1431357ms step_avg:232.36ms step:6161/7050 train_time:1431598ms step_avg:232.36ms step:6162/7050 train_time:1431843ms step_avg:232.37ms step:6163/7050 train_time:1432089ms step_avg:232.37ms step:6164/7050 train_time:1432331ms step_avg:232.37ms step:6165/7050 train_time:1432573ms step_avg:232.37ms step:6166/7050 train_time:1432814ms step_avg:232.37ms step:6167/7050 train_time:1433059ms step_avg:232.38ms 
step:6168/7050 train_time:1433301ms step_avg:232.38ms step:6169/7050 train_time:1433548ms step_avg:232.38ms step:6170/7050 train_time:1433789ms step_avg:232.38ms step:6171/7050 train_time:1434030ms step_avg:232.38ms step:6172/7050 train_time:1434271ms step_avg:232.38ms step:6173/7050 train_time:1434514ms step_avg:232.39ms step:6174/7050 train_time:1434756ms step_avg:232.39ms step:6175/7050 train_time:1435001ms step_avg:232.39ms step:6176/7050 train_time:1435242ms step_avg:232.39ms step:6177/7050 train_time:1435484ms step_avg:232.39ms step:6178/7050 train_time:1435726ms step_avg:232.39ms step:6179/7050 train_time:1435971ms step_avg:232.40ms step:6180/7050 train_time:1436215ms step_avg:232.40ms step:6181/7050 train_time:1436458ms step_avg:232.40ms step:6182/7050 train_time:1436700ms step_avg:232.40ms step:6183/7050 train_time:1436946ms step_avg:232.40ms step:6184/7050 train_time:1437192ms step_avg:232.40ms step:6185/7050 train_time:1437433ms step_avg:232.41ms step:6186/7050 train_time:1437677ms step_avg:232.41ms step:6187/7050 train_time:1437919ms step_avg:232.41ms step:6188/7050 train_time:1438169ms step_avg:232.41ms step:6189/7050 train_time:1438412ms step_avg:232.41ms step:6190/7050 train_time:1438656ms step_avg:232.42ms step:6191/7050 train_time:1438898ms step_avg:232.42ms step:6192/7050 train_time:1439141ms step_avg:232.42ms step:6193/7050 train_time:1439387ms step_avg:232.42ms step:6194/7050 train_time:1439627ms step_avg:232.42ms step:6195/7050 train_time:1439870ms step_avg:232.42ms step:6196/7050 train_time:1440115ms step_avg:232.43ms step:6197/7050 train_time:1440357ms step_avg:232.43ms step:6198/7050 train_time:1440600ms step_avg:232.43ms step:6199/7050 train_time:1440844ms step_avg:232.43ms step:6200/7050 train_time:1441088ms step_avg:232.43ms step:6201/7050 train_time:1441329ms step_avg:232.43ms step:6202/7050 train_time:1441580ms step_avg:232.44ms step:6203/7050 train_time:1441822ms step_avg:232.44ms step:6204/7050 train_time:1442063ms step_avg:232.44ms 
step:6205/7050 train_time:1442304ms step_avg:232.44ms step:6206/7050 train_time:1442547ms step_avg:232.44ms step:6207/7050 train_time:1442791ms step_avg:232.45ms step:6208/7050 train_time:1443032ms step_avg:232.45ms step:6209/7050 train_time:1443274ms step_avg:232.45ms step:6210/7050 train_time:1443518ms step_avg:232.45ms step:6211/7050 train_time:1443764ms step_avg:232.45ms step:6212/7050 train_time:1444008ms step_avg:232.45ms step:6213/7050 train_time:1444250ms step_avg:232.46ms step:6214/7050 train_time:1444493ms step_avg:232.46ms step:6215/7050 train_time:1444735ms step_avg:232.46ms step:6216/7050 train_time:1444979ms step_avg:232.46ms step:6217/7050 train_time:1445222ms step_avg:232.46ms step:6218/7050 train_time:1445464ms step_avg:232.46ms step:6219/7050 train_time:1445707ms step_avg:232.47ms step:6220/7050 train_time:1445951ms step_avg:232.47ms step:6221/7050 train_time:1446194ms step_avg:232.47ms step:6222/7050 train_time:1446439ms step_avg:232.47ms step:6223/7050 train_time:1446681ms step_avg:232.47ms step:6224/7050 train_time:1446926ms step_avg:232.48ms step:6225/7050 train_time:1447170ms step_avg:232.48ms step:6226/7050 train_time:1447414ms step_avg:232.48ms step:6227/7050 train_time:1447658ms step_avg:232.48ms step:6228/7050 train_time:1447899ms step_avg:232.48ms step:6229/7050 train_time:1448144ms step_avg:232.48ms step:6230/7050 train_time:1448388ms step_avg:232.49ms step:6231/7050 train_time:1448632ms step_avg:232.49ms step:6232/7050 train_time:1448874ms step_avg:232.49ms step:6233/7050 train_time:1449117ms step_avg:232.49ms step:6234/7050 train_time:1449359ms step_avg:232.49ms step:6235/7050 train_time:1449604ms step_avg:232.49ms step:6236/7050 train_time:1449849ms step_avg:232.50ms step:6237/7050 train_time:1450089ms step_avg:232.50ms step:6238/7050 train_time:1450334ms step_avg:232.50ms step:6239/7050 train_time:1450577ms step_avg:232.50ms step:6240/7050 train_time:1450823ms step_avg:232.50ms step:6241/7050 train_time:1451065ms step_avg:232.51ms 
step:6242/7050 train_time:1451308ms step_avg:232.51ms step:6243/7050 train_time:1451552ms step_avg:232.51ms step:6244/7050 train_time:1451797ms step_avg:232.51ms step:6245/7050 train_time:1452040ms step_avg:232.51ms step:6246/7050 train_time:1452290ms step_avg:232.52ms step:6247/7050 train_time:1452531ms step_avg:232.52ms step:6248/7050 train_time:1452776ms step_avg:232.52ms step:6249/7050 train_time:1453020ms step_avg:232.52ms step:6250/7050 train_time:1453262ms step_avg:232.52ms step:6250/7050 val_loss:2.9600 train_time:1453452ms step_avg:232.55ms step:6251/7050 train_time:1453504ms step_avg:232.52ms step:6252/7050 train_time:1453745ms step_avg:232.52ms step:6253/7050 train_time:1453996ms step_avg:232.53ms step:6254/7050 train_time:1454238ms step_avg:232.53ms step:6255/7050 train_time:1454481ms step_avg:232.53ms step:6256/7050 train_time:1454724ms step_avg:232.53ms step:6257/7050 train_time:1454969ms step_avg:232.53ms step:6258/7050 train_time:1455212ms step_avg:232.54ms step:6259/7050 train_time:1455462ms step_avg:232.54ms step:6260/7050 train_time:1455701ms step_avg:232.54ms step:6261/7050 train_time:1455947ms step_avg:232.54ms step:6262/7050 train_time:1456187ms step_avg:232.54ms step:6263/7050 train_time:1456431ms step_avg:232.55ms step:6264/7050 train_time:1456673ms step_avg:232.55ms step:6265/7050 train_time:1456915ms step_avg:232.55ms step:6266/7050 train_time:1457159ms step_avg:232.55ms step:6267/7050 train_time:1457400ms step_avg:232.55ms step:6268/7050 train_time:1457645ms step_avg:232.55ms step:6269/7050 train_time:1457887ms step_avg:232.55ms step:6270/7050 train_time:1458130ms step_avg:232.56ms step:6271/7050 train_time:1458374ms step_avg:232.56ms step:6272/7050 train_time:1458618ms step_avg:232.56ms step:6273/7050 train_time:1458859ms step_avg:232.56ms step:6274/7050 train_time:1459102ms step_avg:232.56ms step:6275/7050 train_time:1459347ms step_avg:232.57ms step:6276/7050 train_time:1459594ms step_avg:232.57ms step:6277/7050 train_time:1459834ms 
step_avg:232.57ms step:6278/7050 train_time:1460082ms step_avg:232.57ms step:6279/7050 train_time:1460328ms step_avg:232.57ms step:6280/7050 train_time:1460573ms step_avg:232.58ms step:6281/7050 train_time:1460812ms step_avg:232.58ms step:6282/7050 train_time:1461057ms step_avg:232.58ms step:6283/7050 train_time:1461300ms step_avg:232.58ms step:6284/7050 train_time:1461543ms step_avg:232.58ms step:6285/7050 train_time:1461785ms step_avg:232.58ms step:6286/7050 train_time:1462027ms step_avg:232.58ms step:6287/7050 train_time:1462269ms step_avg:232.59ms step:6288/7050 train_time:1462515ms step_avg:232.59ms step:6289/7050 train_time:1462759ms step_avg:232.59ms step:6290/7050 train_time:1463002ms step_avg:232.59ms step:6291/7050 train_time:1463245ms step_avg:232.59ms step:6292/7050 train_time:1463489ms step_avg:232.60ms step:6293/7050 train_time:1463736ms step_avg:232.60ms step:6294/7050 train_time:1463981ms step_avg:232.60ms step:6295/7050 train_time:1464224ms step_avg:232.60ms step:6296/7050 train_time:1464471ms step_avg:232.60ms step:6297/7050 train_time:1464714ms step_avg:232.61ms step:6298/7050 train_time:1464956ms step_avg:232.61ms step:6299/7050 train_time:1465198ms step_avg:232.61ms step:6300/7050 train_time:1465447ms step_avg:232.61ms step:6301/7050 train_time:1465690ms step_avg:232.61ms step:6302/7050 train_time:1465932ms step_avg:232.61ms step:6303/7050 train_time:1466174ms step_avg:232.62ms step:6304/7050 train_time:1466417ms step_avg:232.62ms step:6305/7050 train_time:1466662ms step_avg:232.62ms step:6306/7050 train_time:1466903ms step_avg:232.62ms step:6307/7050 train_time:1467147ms step_avg:232.62ms step:6308/7050 train_time:1467390ms step_avg:232.62ms step:6309/7050 train_time:1467630ms step_avg:232.62ms step:6310/7050 train_time:1467875ms step_avg:232.63ms step:6311/7050 train_time:1468122ms step_avg:232.63ms step:6312/7050 train_time:1468366ms step_avg:232.63ms step:6313/7050 train_time:1468608ms step_avg:232.63ms step:6314/7050 train_time:1468852ms 
step_avg:232.63ms step:6315/7050 train_time:1469097ms step_avg:232.64ms step:6316/7050 train_time:1469340ms step_avg:232.64ms step:6317/7050 train_time:1469583ms step_avg:232.64ms step:6318/7050 train_time:1469824ms step_avg:232.64ms step:6319/7050 train_time:1470068ms step_avg:232.64ms step:6320/7050 train_time:1470312ms step_avg:232.64ms step:6321/7050 train_time:1470556ms step_avg:232.65ms step:6322/7050 train_time:1470803ms step_avg:232.65ms step:6323/7050 train_time:1471050ms step_avg:232.65ms step:6324/7050 train_time:1471292ms step_avg:232.65ms step:6325/7050 train_time:1471535ms step_avg:232.65ms step:6326/7050 train_time:1471778ms step_avg:232.66ms step:6327/7050 train_time:1472024ms step_avg:232.66ms step:6328/7050 train_time:1472264ms step_avg:232.66ms step:6329/7050 train_time:1472506ms step_avg:232.66ms step:6330/7050 train_time:1472757ms step_avg:232.66ms step:6331/7050 train_time:1473002ms step_avg:232.67ms step:6332/7050 train_time:1473244ms step_avg:232.67ms step:6333/7050 train_time:1473487ms step_avg:232.67ms step:6334/7050 train_time:1473731ms step_avg:232.67ms step:6335/7050 train_time:1473974ms step_avg:232.67ms step:6336/7050 train_time:1474223ms step_avg:232.67ms step:6337/7050 train_time:1474467ms step_avg:232.68ms step:6338/7050 train_time:1474711ms step_avg:232.68ms step:6339/7050 train_time:1474954ms step_avg:232.68ms step:6340/7050 train_time:1475199ms step_avg:232.68ms step:6341/7050 train_time:1475441ms step_avg:232.68ms step:6342/7050 train_time:1475687ms step_avg:232.68ms step:6343/7050 train_time:1475928ms step_avg:232.69ms step:6344/7050 train_time:1476176ms step_avg:232.69ms step:6345/7050 train_time:1476417ms step_avg:232.69ms step:6346/7050 train_time:1476663ms step_avg:232.69ms step:6347/7050 train_time:1476904ms step_avg:232.69ms step:6348/7050 train_time:1477150ms step_avg:232.70ms step:6349/7050 train_time:1477392ms step_avg:232.70ms step:6350/7050 train_time:1477636ms step_avg:232.70ms step:6351/7050 train_time:1477882ms 
step_avg:232.70ms step:6352/7050 train_time:1478126ms step_avg:232.70ms step:6353/7050 train_time:1478370ms step_avg:232.70ms step:6354/7050 train_time:1478615ms step_avg:232.71ms step:6355/7050 train_time:1478860ms step_avg:232.71ms step:6356/7050 train_time:1479103ms step_avg:232.71ms step:6357/7050 train_time:1479347ms step_avg:232.71ms step:6358/7050 train_time:1479591ms step_avg:232.71ms step:6359/7050 train_time:1479835ms step_avg:232.72ms step:6360/7050 train_time:1480079ms step_avg:232.72ms step:6361/7050 train_time:1480322ms step_avg:232.72ms step:6362/7050 train_time:1480565ms step_avg:232.72ms step:6363/7050 train_time:1480809ms step_avg:232.72ms step:6364/7050 train_time:1481054ms step_avg:232.72ms step:6365/7050 train_time:1481298ms step_avg:232.73ms step:6366/7050 train_time:1481546ms step_avg:232.73ms step:6367/7050 train_time:1481792ms step_avg:232.73ms step:6368/7050 train_time:1482033ms step_avg:232.73ms step:6369/7050 train_time:1482275ms step_avg:232.73ms step:6370/7050 train_time:1482518ms step_avg:232.73ms step:6371/7050 train_time:1482762ms step_avg:232.74ms step:6372/7050 train_time:1483003ms step_avg:232.74ms step:6373/7050 train_time:1483245ms step_avg:232.74ms step:6374/7050 train_time:1483493ms step_avg:232.74ms step:6375/7050 train_time:1483736ms step_avg:232.74ms step:6375/7050 val_loss:2.9510 train_time:1483927ms step_avg:232.77ms step:6376/7050 train_time:1483978ms step_avg:232.74ms step:6377/7050 train_time:1484221ms step_avg:232.75ms step:6378/7050 train_time:1484470ms step_avg:232.75ms step:6379/7050 train_time:1484715ms step_avg:232.75ms step:6380/7050 train_time:1484956ms step_avg:232.75ms step:6381/7050 train_time:1485199ms step_avg:232.75ms step:6382/7050 train_time:1485443ms step_avg:232.76ms step:6383/7050 train_time:1485685ms step_avg:232.76ms step:6384/7050 train_time:1485932ms step_avg:232.76ms step:6385/7050 train_time:1486174ms step_avg:232.76ms step:6386/7050 train_time:1486418ms step_avg:232.76ms step:6387/7050 
train_time:1486661ms step_avg:232.76ms step:6388/7050 train_time:1486904ms step_avg:232.77ms step:6389/7050 train_time:1487146ms step_avg:232.77ms step:6390/7050 train_time:1487390ms step_avg:232.77ms step:6391/7050 train_time:1487631ms step_avg:232.77ms step:6392/7050 train_time:1487876ms step_avg:232.77ms step:6393/7050 train_time:1488119ms step_avg:232.77ms step:6394/7050 train_time:1488369ms step_avg:232.78ms step:6395/7050 train_time:1488610ms step_avg:232.78ms step:6396/7050 train_time:1488855ms step_avg:232.78ms step:6397/7050 train_time:1489098ms step_avg:232.78ms step:6398/7050 train_time:1489341ms step_avg:232.78ms step:6399/7050 train_time:1489582ms step_avg:232.78ms step:6400/7050 train_time:1489827ms step_avg:232.79ms step:6401/7050 train_time:1490071ms step_avg:232.79ms step:6402/7050 train_time:1490318ms step_avg:232.79ms step:6403/7050 train_time:1490558ms step_avg:232.79ms step:6404/7050 train_time:1490802ms step_avg:232.79ms step:6405/7050 train_time:1491046ms step_avg:232.79ms step:6406/7050 train_time:1491292ms step_avg:232.80ms step:6407/7050 train_time:1491536ms step_avg:232.80ms step:6408/7050 train_time:1491780ms step_avg:232.80ms step:6409/7050 train_time:1492022ms step_avg:232.80ms step:6410/7050 train_time:1492265ms step_avg:232.80ms step:6411/7050 train_time:1492506ms step_avg:232.80ms step:6412/7050 train_time:1492749ms step_avg:232.81ms step:6413/7050 train_time:1492999ms step_avg:232.81ms step:6414/7050 train_time:1493244ms step_avg:232.81ms step:6415/7050 train_time:1493486ms step_avg:232.81ms step:6416/7050 train_time:1493730ms step_avg:232.81ms step:6417/7050 train_time:1493973ms step_avg:232.81ms step:6418/7050 train_time:1494216ms step_avg:232.82ms step:6419/7050 train_time:1494463ms step_avg:232.82ms step:6420/7050 train_time:1494705ms step_avg:232.82ms step:6421/7050 train_time:1494953ms step_avg:232.82ms step:6422/7050 train_time:1495194ms step_avg:232.82ms step:6423/7050 train_time:1495440ms step_avg:232.83ms step:6424/7050 
train_time:1495682ms step_avg:232.83ms step:6425/7050 train_time:1495926ms step_avg:232.83ms step:6426/7050 train_time:1496170ms step_avg:232.83ms step:6427/7050 train_time:1496412ms step_avg:232.83ms step:6428/7050 train_time:1496655ms step_avg:232.83ms step:6429/7050 train_time:1496902ms step_avg:232.84ms step:6430/7050 train_time:1497147ms step_avg:232.84ms step:6431/7050 train_time:1497391ms step_avg:232.84ms step:6432/7050 train_time:1497635ms step_avg:232.84ms step:6433/7050 train_time:1497881ms step_avg:232.84ms step:6434/7050 train_time:1498121ms step_avg:232.84ms step:6435/7050 train_time:1498364ms step_avg:232.85ms step:6436/7050 train_time:1498612ms step_avg:232.85ms step:6437/7050 train_time:1498855ms step_avg:232.85ms step:6438/7050 train_time:1499097ms step_avg:232.85ms step:6439/7050 train_time:1499341ms step_avg:232.85ms step:6440/7050 train_time:1499588ms step_avg:232.86ms step:6441/7050 train_time:1499831ms step_avg:232.86ms step:6442/7050 train_time:1500074ms step_avg:232.86ms step:6443/7050 train_time:1500320ms step_avg:232.86ms step:6444/7050 train_time:1500563ms step_avg:232.86ms step:6445/7050 train_time:1500807ms step_avg:232.86ms step:6446/7050 train_time:1501052ms step_avg:232.87ms step:6447/7050 train_time:1501298ms step_avg:232.87ms step:6448/7050 train_time:1501541ms step_avg:232.87ms step:6449/7050 train_time:1501784ms step_avg:232.87ms step:6450/7050 train_time:1502028ms step_avg:232.87ms step:6451/7050 train_time:1502272ms step_avg:232.87ms step:6452/7050 train_time:1502516ms step_avg:232.88ms step:6453/7050 train_time:1502760ms step_avg:232.88ms step:6454/7050 train_time:1503004ms step_avg:232.88ms step:6455/7050 train_time:1503246ms step_avg:232.88ms step:6456/7050 train_time:1503494ms step_avg:232.88ms step:6457/7050 train_time:1503737ms step_avg:232.88ms step:6458/7050 train_time:1503986ms step_avg:232.89ms step:6459/7050 train_time:1504228ms step_avg:232.89ms step:6460/7050 train_time:1504473ms step_avg:232.89ms step:6461/7050 
train_time:1504717ms step_avg:232.89ms step:6462/7050 train_time:1504959ms step_avg:232.89ms step:6463/7050 train_time:1505200ms step_avg:232.90ms step:6464/7050 train_time:1505445ms step_avg:232.90ms step:6465/7050 train_time:1505689ms step_avg:232.90ms step:6466/7050 train_time:1505935ms step_avg:232.90ms step:6467/7050 train_time:1506181ms step_avg:232.90ms step:6468/7050 train_time:1506423ms step_avg:232.90ms step:6469/7050 train_time:1506665ms step_avg:232.91ms step:6470/7050 train_time:1506914ms step_avg:232.91ms step:6471/7050 train_time:1507156ms step_avg:232.91ms step:6472/7050 train_time:1507397ms step_avg:232.91ms step:6473/7050 train_time:1507641ms step_avg:232.91ms step:6474/7050 train_time:1507882ms step_avg:232.91ms step:6475/7050 train_time:1508125ms step_avg:232.91ms step:6476/7050 train_time:1508367ms step_avg:232.92ms step:6477/7050 train_time:1508622ms step_avg:232.92ms step:6478/7050 train_time:1508864ms step_avg:232.92ms step:6479/7050 train_time:1509106ms step_avg:232.92ms step:6480/7050 train_time:1509347ms step_avg:232.92ms step:6481/7050 train_time:1509589ms step_avg:232.93ms step:6482/7050 train_time:1509834ms step_avg:232.93ms step:6483/7050 train_time:1510074ms step_avg:232.93ms step:6484/7050 train_time:1510320ms step_avg:232.93ms step:6485/7050 train_time:1510563ms step_avg:232.93ms step:6486/7050 train_time:1510807ms step_avg:232.93ms step:6487/7050 train_time:1511050ms step_avg:232.94ms step:6488/7050 train_time:1511292ms step_avg:232.94ms step:6489/7050 train_time:1511537ms step_avg:232.94ms step:6490/7050 train_time:1511779ms step_avg:232.94ms step:6491/7050 train_time:1512022ms step_avg:232.94ms step:6492/7050 train_time:1512266ms step_avg:232.94ms step:6493/7050 train_time:1512508ms step_avg:232.94ms step:6494/7050 train_time:1512749ms step_avg:232.95ms step:6495/7050 train_time:1512992ms step_avg:232.95ms step:6496/7050 train_time:1513235ms step_avg:232.95ms step:6497/7050 train_time:1513481ms step_avg:232.95ms step:6498/7050 
train_time:1513726ms step_avg:232.95ms step:6499/7050 train_time:1513977ms step_avg:232.96ms step:6500/7050 train_time:1514218ms step_avg:232.96ms step:6500/7050 val_loss:2.9433 train_time:1514410ms step_avg:232.99ms step:6501/7050 train_time:1514462ms step_avg:232.96ms step:6502/7050 train_time:1514708ms step_avg:232.96ms step:6503/7050 train_time:1514955ms step_avg:232.96ms step:6504/7050 train_time:1515203ms step_avg:232.96ms step:6505/7050 train_time:1515448ms step_avg:232.97ms step:6506/7050 train_time:1515691ms step_avg:232.97ms step:6507/7050 train_time:1515935ms step_avg:232.97ms step:6508/7050 train_time:1516180ms step_avg:232.97ms step:6509/7050 train_time:1516427ms step_avg:232.97ms step:6510/7050 train_time:1516672ms step_avg:232.98ms step:6511/7050 train_time:1516914ms step_avg:232.98ms step:6512/7050 train_time:1517161ms step_avg:232.98ms step:6513/7050 train_time:1517402ms step_avg:232.98ms step:6514/7050 train_time:1517645ms step_avg:232.98ms step:6515/7050 train_time:1517897ms step_avg:232.99ms step:6516/7050 train_time:1518141ms step_avg:232.99ms step:6517/7050 train_time:1518390ms step_avg:232.99ms step:6518/7050 train_time:1518633ms step_avg:232.99ms step:6519/7050 train_time:1518876ms step_avg:232.99ms step:6520/7050 train_time:1519120ms step_avg:232.99ms step:6521/7050 train_time:1519366ms step_avg:233.00ms step:6522/7050 train_time:1519608ms step_avg:233.00ms step:6523/7050 train_time:1519853ms step_avg:233.00ms step:6524/7050 train_time:1520095ms step_avg:233.00ms step:6525/7050 train_time:1520341ms step_avg:233.00ms step:6526/7050 train_time:1520585ms step_avg:233.00ms step:6527/7050 train_time:1520826ms step_avg:233.01ms step:6528/7050 train_time:1521068ms step_avg:233.01ms step:6529/7050 train_time:1521313ms step_avg:233.01ms step:6530/7050 train_time:1521561ms step_avg:233.01ms step:6531/7050 train_time:1521807ms step_avg:233.01ms step:6532/7050 train_time:1522050ms step_avg:233.01ms step:6533/7050 train_time:1522295ms step_avg:233.02ms 
step:6534/7050 train_time:1522537ms step_avg:233.02ms step:6535/7050 train_time:1522784ms step_avg:233.02ms step:6536/7050 train_time:1523032ms step_avg:233.02ms step:6537/7050 train_time:1523275ms step_avg:233.02ms step:6538/7050 train_time:1523519ms step_avg:233.03ms step:6539/7050 train_time:1523762ms step_avg:233.03ms step:6540/7050 train_time:1524005ms step_avg:233.03ms step:6541/7050 train_time:1524253ms step_avg:233.03ms step:6542/7050 train_time:1524499ms step_avg:233.03ms step:6543/7050 train_time:1524745ms step_avg:233.03ms step:6544/7050 train_time:1524993ms step_avg:233.04ms step:6545/7050 train_time:1525236ms step_avg:233.04ms step:6546/7050 train_time:1525477ms step_avg:233.04ms step:6547/7050 train_time:1525719ms step_avg:233.04ms step:6548/7050 train_time:1525962ms step_avg:233.04ms step:6549/7050 train_time:1526204ms step_avg:233.04ms step:6550/7050 train_time:1526446ms step_avg:233.05ms step:6551/7050 train_time:1526692ms step_avg:233.05ms step:6552/7050 train_time:1526938ms step_avg:233.05ms step:6553/7050 train_time:1527182ms step_avg:233.05ms step:6554/7050 train_time:1527423ms step_avg:233.05ms step:6555/7050 train_time:1527667ms step_avg:233.05ms step:6556/7050 train_time:1527911ms step_avg:233.06ms step:6557/7050 train_time:1528154ms step_avg:233.06ms step:6558/7050 train_time:1528399ms step_avg:233.06ms step:6559/7050 train_time:1528644ms step_avg:233.06ms step:6560/7050 train_time:1528887ms step_avg:233.06ms step:6561/7050 train_time:1529130ms step_avg:233.06ms step:6562/7050 train_time:1529373ms step_avg:233.07ms step:6563/7050 train_time:1529618ms step_avg:233.07ms step:6564/7050 train_time:1529862ms step_avg:233.07ms step:6565/7050 train_time:1530106ms step_avg:233.07ms step:6566/7050 train_time:1530347ms step_avg:233.07ms step:6567/7050 train_time:1530593ms step_avg:233.07ms step:6568/7050 train_time:1530835ms step_avg:233.07ms step:6569/7050 train_time:1531081ms step_avg:233.08ms step:6570/7050 train_time:1531325ms step_avg:233.08ms 
step:6571/7050 train_time:1531567ms step_avg:233.08ms step:6572/7050 train_time:1531808ms step_avg:233.08ms step:6573/7050 train_time:1532052ms step_avg:233.08ms step:6574/7050 train_time:1532296ms step_avg:233.08ms step:6575/7050 train_time:1532545ms step_avg:233.09ms step:6576/7050 train_time:1532787ms step_avg:233.09ms step:6577/7050 train_time:1533032ms step_avg:233.09ms step:6578/7050 train_time:1533278ms step_avg:233.09ms step:6579/7050 train_time:1533522ms step_avg:233.09ms step:6580/7050 train_time:1533765ms step_avg:233.10ms step:6581/7050 train_time:1534008ms step_avg:233.10ms step:6582/7050 train_time:1534250ms step_avg:233.10ms step:6583/7050 train_time:1534493ms step_avg:233.10ms step:6584/7050 train_time:1534737ms step_avg:233.10ms step:6585/7050 train_time:1534978ms step_avg:233.10ms step:6586/7050 train_time:1535220ms step_avg:233.10ms step:6587/7050 train_time:1535463ms step_avg:233.11ms step:6588/7050 train_time:1535704ms step_avg:233.11ms step:6589/7050 train_time:1535946ms step_avg:233.11ms step:6590/7050 train_time:1536189ms step_avg:233.11ms step:6591/7050 train_time:1536435ms step_avg:233.11ms step:6592/7050 train_time:1536680ms step_avg:233.11ms step:6593/7050 train_time:1536924ms step_avg:233.11ms step:6594/7050 train_time:1537166ms step_avg:233.12ms step:6595/7050 train_time:1537409ms step_avg:233.12ms step:6596/7050 train_time:1537653ms step_avg:233.12ms step:6597/7050 train_time:1537898ms step_avg:233.12ms step:6598/7050 train_time:1538140ms step_avg:233.12ms step:6599/7050 train_time:1538387ms step_avg:233.12ms step:6600/7050 train_time:1538628ms step_avg:233.13ms step:6601/7050 train_time:1538872ms step_avg:233.13ms step:6602/7050 train_time:1539114ms step_avg:233.13ms step:6603/7050 train_time:1539357ms step_avg:233.13ms step:6604/7050 train_time:1539608ms step_avg:233.13ms step:6605/7050 train_time:1539854ms step_avg:233.13ms step:6606/7050 train_time:1540095ms step_avg:233.14ms step:6607/7050 train_time:1540337ms step_avg:233.14ms 
step:6608/7050 train_time:1540580ms step_avg:233.14ms step:6609/7050 train_time:1540827ms step_avg:233.14ms step:6610/7050 train_time:1541070ms step_avg:233.14ms step:6611/7050 train_time:1541314ms step_avg:233.14ms step:6612/7050 train_time:1541558ms step_avg:233.15ms step:6613/7050 train_time:1541803ms step_avg:233.15ms step:6614/7050 train_time:1542047ms step_avg:233.15ms step:6615/7050 train_time:1542290ms step_avg:233.15ms step:6616/7050 train_time:1542532ms step_avg:233.15ms step:6617/7050 train_time:1542774ms step_avg:233.15ms step:6618/7050 train_time:1543017ms step_avg:233.15ms step:6619/7050 train_time:1543258ms step_avg:233.16ms step:6620/7050 train_time:1543504ms step_avg:233.16ms step:6621/7050 train_time:1543746ms step_avg:233.16ms step:6622/7050 train_time:1543994ms step_avg:233.16ms step:6623/7050 train_time:1544239ms step_avg:233.16ms step:6624/7050 train_time:1544483ms step_avg:233.16ms step:6625/7050 train_time:1544724ms step_avg:233.17ms step:6625/7050 val_loss:2.9359 train_time:1544918ms step_avg:233.20ms step:6626/7050 train_time:1544970ms step_avg:233.17ms step:6627/7050 train_time:1545217ms step_avg:233.17ms step:6628/7050 train_time:1545463ms step_avg:233.17ms step:6629/7050 train_time:1545705ms step_avg:233.17ms step:6630/7050 train_time:1545947ms step_avg:233.17ms step:6631/7050 train_time:1546190ms step_avg:233.18ms step:6632/7050 train_time:1546440ms step_avg:233.18ms step:6633/7050 train_time:1546682ms step_avg:233.18ms step:6634/7050 train_time:1546923ms step_avg:233.18ms step:6635/7050 train_time:1547164ms step_avg:233.18ms step:6636/7050 train_time:1547408ms step_avg:233.18ms step:6637/7050 train_time:1547650ms step_avg:233.19ms step:6638/7050 train_time:1547893ms step_avg:233.19ms step:6639/7050 train_time:1548138ms step_avg:233.19ms step:6640/7050 train_time:1548380ms step_avg:233.19ms step:6641/7050 train_time:1548624ms step_avg:233.19ms step:6642/7050 train_time:1548869ms step_avg:233.19ms step:6643/7050 train_time:1549111ms 
step_avg:233.19ms step:6644/7050 train_time:1549354ms step_avg:233.20ms step:6645/7050 train_time:1549599ms step_avg:233.20ms step:6646/7050 train_time:1549845ms step_avg:233.20ms step:6647/7050 train_time:1550089ms step_avg:233.20ms step:6648/7050 train_time:1550334ms step_avg:233.20ms step:6649/7050 train_time:1550583ms step_avg:233.21ms step:6650/7050 train_time:1550827ms step_avg:233.21ms step:6651/7050 train_time:1551069ms step_avg:233.21ms step:6652/7050 train_time:1551311ms step_avg:233.21ms step:6653/7050 train_time:1551555ms step_avg:233.21ms step:6654/7050 train_time:1551799ms step_avg:233.21ms step:6655/7050 train_time:1552040ms step_avg:233.21ms step:6656/7050 train_time:1552283ms step_avg:233.22ms step:6657/7050 train_time:1552530ms step_avg:233.22ms step:6658/7050 train_time:1552772ms step_avg:233.22ms step:6659/7050 train_time:1553014ms step_avg:233.22ms step:6660/7050 train_time:1553258ms step_avg:233.22ms step:6661/7050 train_time:1553500ms step_avg:233.22ms step:6662/7050 train_time:1553742ms step_avg:233.22ms step:6663/7050 train_time:1553988ms step_avg:233.23ms step:6664/7050 train_time:1554231ms step_avg:233.23ms step:6665/7050 train_time:1554473ms step_avg:233.23ms step:6666/7050 train_time:1554713ms step_avg:233.23ms step:6667/7050 train_time:1554958ms step_avg:233.23ms step:6668/7050 train_time:1555202ms step_avg:233.23ms step:6669/7050 train_time:1555445ms step_avg:233.24ms step:6670/7050 train_time:1555687ms step_avg:233.24ms step:6671/7050 train_time:1555934ms step_avg:233.24ms step:6672/7050 train_time:1556180ms step_avg:233.24ms step:6673/7050 train_time:1556424ms step_avg:233.24ms step:6674/7050 train_time:1556667ms step_avg:233.24ms step:6675/7050 train_time:1556911ms step_avg:233.25ms step:6676/7050 train_time:1557154ms step_avg:233.25ms step:6677/7050 train_time:1557396ms step_avg:233.25ms step:6678/7050 train_time:1557642ms step_avg:233.25ms step:6679/7050 train_time:1557885ms step_avg:233.25ms step:6680/7050 train_time:1558130ms 
step_avg:233.25ms step:6681/7050 train_time:1558375ms step_avg:233.25ms step:6682/7050 train_time:1558617ms step_avg:233.26ms step:6683/7050 train_time:1558859ms step_avg:233.26ms step:6684/7050 train_time:1559101ms step_avg:233.26ms step:6685/7050 train_time:1559345ms step_avg:233.26ms step:6686/7050 train_time:1559591ms step_avg:233.26ms step:6687/7050 train_time:1559831ms step_avg:233.26ms step:6688/7050 train_time:1560076ms step_avg:233.26ms step:6689/7050 train_time:1560320ms step_avg:233.27ms step:6690/7050 train_time:1560562ms step_avg:233.27ms step:6691/7050 train_time:1560807ms step_avg:233.27ms step:6692/7050 train_time:1561054ms step_avg:233.27ms step:6693/7050 train_time:1561297ms step_avg:233.27ms step:6694/7050 train_time:1561545ms step_avg:233.28ms step:6695/7050 train_time:1561788ms step_avg:233.28ms step:6696/7050 train_time:1562033ms step_avg:233.28ms step:6697/7050 train_time:1562277ms step_avg:233.28ms step:6698/7050 train_time:1562519ms step_avg:233.28ms step:6699/7050 train_time:1562762ms step_avg:233.28ms step:6700/7050 train_time:1563007ms step_avg:233.28ms step:6701/7050 train_time:1563254ms step_avg:233.29ms step:6702/7050 train_time:1563498ms step_avg:233.29ms step:6703/7050 train_time:1563740ms step_avg:233.29ms step:6704/7050 train_time:1563983ms step_avg:233.29ms step:6705/7050 train_time:1564226ms step_avg:233.29ms step:6706/7050 train_time:1564471ms step_avg:233.29ms step:6707/7050 train_time:1564714ms step_avg:233.30ms step:6708/7050 train_time:1564958ms step_avg:233.30ms step:6709/7050 train_time:1565204ms step_avg:233.30ms step:6710/7050 train_time:1565450ms step_avg:233.30ms step:6711/7050 train_time:1565693ms step_avg:233.30ms step:6712/7050 train_time:1565943ms step_avg:233.31ms step:6713/7050 train_time:1566188ms step_avg:233.31ms step:6714/7050 train_time:1566431ms step_avg:233.31ms step:6715/7050 train_time:1566676ms step_avg:233.31ms step:6716/7050 train_time:1566923ms step_avg:233.31ms step:6717/7050 train_time:1567166ms 
step_avg:233.31ms step:6718/7050 train_time:1567407ms step_avg:233.31ms step:6719/7050 train_time:1567654ms step_avg:233.32ms step:6720/7050 train_time:1567899ms step_avg:233.32ms step:6721/7050 train_time:1568141ms step_avg:233.32ms step:6722/7050 train_time:1568385ms step_avg:233.32ms step:6723/7050 train_time:1568629ms step_avg:233.32ms step:6724/7050 train_time:1568870ms step_avg:233.32ms step:6725/7050 train_time:1569115ms step_avg:233.33ms step:6726/7050 train_time:1569359ms step_avg:233.33ms step:6727/7050 train_time:1569602ms step_avg:233.33ms step:6728/7050 train_time:1569849ms step_avg:233.33ms step:6729/7050 train_time:1570093ms step_avg:233.33ms step:6730/7050 train_time:1570334ms step_avg:233.33ms step:6731/7050 train_time:1570576ms step_avg:233.33ms step:6732/7050 train_time:1570819ms step_avg:233.34ms step:6733/7050 train_time:1571064ms step_avg:233.34ms step:6734/7050 train_time:1571306ms step_avg:233.34ms step:6735/7050 train_time:1571547ms step_avg:233.34ms step:6736/7050 train_time:1571789ms step_avg:233.34ms step:6737/7050 train_time:1572034ms step_avg:233.34ms step:6738/7050 train_time:1572277ms step_avg:233.34ms step:6739/7050 train_time:1572519ms step_avg:233.35ms step:6740/7050 train_time:1572762ms step_avg:233.35ms step:6741/7050 train_time:1573006ms step_avg:233.35ms step:6742/7050 train_time:1573251ms step_avg:233.35ms step:6743/7050 train_time:1573495ms step_avg:233.35ms step:6744/7050 train_time:1573738ms step_avg:233.35ms step:6745/7050 train_time:1573981ms step_avg:233.36ms step:6746/7050 train_time:1574226ms step_avg:233.36ms step:6747/7050 train_time:1574469ms step_avg:233.36ms step:6748/7050 train_time:1574712ms step_avg:233.36ms step:6749/7050 train_time:1574958ms step_avg:233.36ms step:6750/7050 train_time:1575201ms step_avg:233.36ms step:6750/7050 val_loss:2.9295 train_time:1575394ms step_avg:233.39ms step:6751/7050 train_time:1575445ms step_avg:233.36ms step:6752/7050 train_time:1575690ms step_avg:233.37ms step:6753/7050 
train_time:1575935ms step_avg:233.37ms step:6754/7050 train_time:1576177ms step_avg:233.37ms step:6755/7050 train_time:1576418ms step_avg:233.37ms step:6756/7050 train_time:1576661ms step_avg:233.37ms step:6757/7050 train_time:1576909ms step_avg:233.37ms step:6758/7050 train_time:1577153ms step_avg:233.38ms step:6759/7050 train_time:1577393ms step_avg:233.38ms step:6760/7050 train_time:1577640ms step_avg:233.38ms step:6761/7050 train_time:1577882ms step_avg:233.38ms step:6762/7050 train_time:1578124ms step_avg:233.38ms step:6763/7050 train_time:1578372ms step_avg:233.38ms step:6764/7050 train_time:1578614ms step_avg:233.38ms step:6765/7050 train_time:1578857ms step_avg:233.39ms step:6766/7050 train_time:1579101ms step_avg:233.39ms step:6767/7050 train_time:1579348ms step_avg:233.39ms step:6768/7050 train_time:1579591ms step_avg:233.39ms step:6769/7050 train_time:1579833ms step_avg:233.39ms step:6770/7050 train_time:1580077ms step_avg:233.39ms step:6771/7050 train_time:1580322ms step_avg:233.40ms step:6772/7050 train_time:1580564ms step_avg:233.40ms step:6773/7050 train_time:1580806ms step_avg:233.40ms step:6774/7050 train_time:1581049ms step_avg:233.40ms step:6775/7050 train_time:1581294ms step_avg:233.40ms step:6776/7050 train_time:1581536ms step_avg:233.40ms step:6777/7050 train_time:1581787ms step_avg:233.41ms step:6778/7050 train_time:1582031ms step_avg:233.41ms step:6779/7050 train_time:1582274ms step_avg:233.41ms step:6780/7050 train_time:1582521ms step_avg:233.41ms step:6781/7050 train_time:1582765ms step_avg:233.41ms step:6782/7050 train_time:1583006ms step_avg:233.41ms step:6783/7050 train_time:1583253ms step_avg:233.41ms step:6784/7050 train_time:1583505ms step_avg:233.42ms step:6785/7050 train_time:1583745ms step_avg:233.42ms step:6786/7050 train_time:1583989ms step_avg:233.42ms step:6787/7050 train_time:1584232ms step_avg:233.42ms step:6788/7050 train_time:1584477ms step_avg:233.42ms step:6789/7050 train_time:1584724ms step_avg:233.43ms step:6790/7050 
train_time:1584968ms step_avg:233.43ms step:6791/7050 train_time:1585213ms step_avg:233.43ms step:6792/7050 train_time:1585458ms step_avg:233.43ms step:6793/7050 train_time:1585707ms step_avg:233.43ms step:6794/7050 train_time:1585959ms step_avg:233.44ms step:6795/7050 train_time:1586200ms step_avg:233.44ms step:6796/7050 train_time:1586448ms step_avg:233.44ms step:6797/7050 train_time:1586696ms step_avg:233.44ms step:6798/7050 train_time:1586940ms step_avg:233.44ms step:6799/7050 train_time:1587185ms step_avg:233.44ms step:6800/7050 train_time:1587433ms step_avg:233.45ms step:6801/7050 train_time:1587677ms step_avg:233.45ms step:6802/7050 train_time:1587928ms step_avg:233.45ms step:6803/7050 train_time:1588171ms step_avg:233.45ms step:6804/7050 train_time:1588418ms step_avg:233.45ms step:6805/7050 train_time:1588671ms step_avg:233.46ms step:6806/7050 train_time:1588913ms step_avg:233.46ms step:6807/7050 train_time:1589161ms step_avg:233.46ms step:6808/7050 train_time:1589412ms step_avg:233.46ms step:6809/7050 train_time:1589661ms step_avg:233.46ms step:6810/7050 train_time:1589905ms step_avg:233.47ms step:6811/7050 train_time:1590150ms step_avg:233.47ms step:6812/7050 train_time:1590396ms step_avg:233.47ms step:6813/7050 train_time:1590644ms step_avg:233.47ms step:6814/7050 train_time:1590889ms step_avg:233.47ms step:6815/7050 train_time:1591133ms step_avg:233.48ms step:6816/7050 train_time:1591378ms step_avg:233.48ms step:6817/7050 train_time:1591623ms step_avg:233.48ms step:6818/7050 train_time:1591869ms step_avg:233.48ms step:6819/7050 train_time:1592123ms step_avg:233.48ms step:6820/7050 train_time:1592369ms step_avg:233.49ms step:6821/7050 train_time:1592618ms step_avg:233.49ms step:6822/7050 train_time:1592867ms step_avg:233.49ms step:6823/7050 train_time:1593112ms step_avg:233.49ms step:6824/7050 train_time:1593356ms step_avg:233.49ms step:6825/7050 train_time:1593604ms step_avg:233.50ms step:6826/7050 train_time:1593846ms step_avg:233.50ms step:6827/7050 
train_time:1594104ms step_avg:233.50ms step:6828/7050 train_time:1594345ms step_avg:233.50ms step:6829/7050 train_time:1594593ms step_avg:233.50ms step:6830/7050 train_time:1594839ms step_avg:233.51ms step:6831/7050 train_time:1595084ms step_avg:233.51ms step:6832/7050 train_time:1595327ms step_avg:233.51ms step:6833/7050 train_time:1595572ms step_avg:233.51ms step:6834/7050 train_time:1595818ms step_avg:233.51ms step:6835/7050 train_time:1596069ms step_avg:233.51ms step:6836/7050 train_time:1596322ms step_avg:233.52ms step:6837/7050 train_time:1596566ms step_avg:233.52ms step:6838/7050 train_time:1596813ms step_avg:233.52ms step:6839/7050 train_time:1597061ms step_avg:233.52ms step:6840/7050 train_time:1597307ms step_avg:233.52ms step:6841/7050 train_time:1597552ms step_avg:233.53ms step:6842/7050 train_time:1597796ms step_avg:233.53ms step:6843/7050 train_time:1598042ms step_avg:233.53ms step:6844/7050 train_time:1598291ms step_avg:233.53ms step:6845/7050 train_time:1598539ms step_avg:233.53ms step:6846/7050 train_time:1598783ms step_avg:233.54ms step:6847/7050 train_time:1599029ms step_avg:233.54ms step:6848/7050 train_time:1599285ms step_avg:233.54ms step:6849/7050 train_time:1599528ms step_avg:233.54ms step:6850/7050 train_time:1599772ms step_avg:233.54ms step:6851/7050 train_time:1600020ms step_avg:233.55ms step:6852/7050 train_time:1600267ms step_avg:233.55ms step:6853/7050 train_time:1600514ms step_avg:233.55ms step:6854/7050 train_time:1600756ms step_avg:233.55ms step:6855/7050 train_time:1601003ms step_avg:233.55ms step:6856/7050 train_time:1601251ms step_avg:233.55ms step:6857/7050 train_time:1601503ms step_avg:233.56ms step:6858/7050 train_time:1601747ms step_avg:233.56ms step:6859/7050 train_time:1601995ms step_avg:233.56ms step:6860/7050 train_time:1602245ms step_avg:233.56ms step:6861/7050 train_time:1602497ms step_avg:233.57ms step:6862/7050 train_time:1602745ms step_avg:233.57ms step:6863/7050 train_time:1602986ms step_avg:233.57ms step:6864/7050 
train_time:1603234ms step_avg:233.57ms step:6865/7050 train_time:1603477ms step_avg:233.57ms step:6866/7050 train_time:1603724ms step_avg:233.57ms step:6867/7050 train_time:1603969ms step_avg:233.58ms step:6868/7050 train_time:1604213ms step_avg:233.58ms step:6869/7050 train_time:1604459ms step_avg:233.58ms step:6870/7050 train_time:1604711ms step_avg:233.58ms step:6871/7050 train_time:1604957ms step_avg:233.58ms step:6872/7050 train_time:1605202ms step_avg:233.59ms step:6873/7050 train_time:1605444ms step_avg:233.59ms step:6874/7050 train_time:1605691ms step_avg:233.59ms step:6875/7050 train_time:1605941ms step_avg:233.59ms step:6875/7050 val_loss:2.9235 train_time:1606134ms step_avg:233.62ms step:6876/7050 train_time:1606187ms step_avg:233.59ms step:6877/7050 train_time:1606435ms step_avg:233.60ms step:6878/7050 train_time:1606683ms step_avg:233.60ms step:6879/7050 train_time:1606928ms step_avg:233.60ms step:6880/7050 train_time:1607173ms step_avg:233.60ms step:6881/7050 train_time:1607423ms step_avg:233.60ms step:6882/7050 train_time:1607678ms step_avg:233.61ms step:6883/7050 train_time:1607924ms step_avg:233.61ms step:6884/7050 train_time:1608171ms step_avg:233.61ms step:6885/7050 train_time:1608417ms step_avg:233.61ms step:6886/7050 train_time:1608664ms step_avg:233.61ms step:6887/7050 train_time:1608907ms step_avg:233.62ms step:6888/7050 train_time:1609153ms step_avg:233.62ms step:6889/7050 train_time:1609402ms step_avg:233.62ms step:6890/7050 train_time:1609653ms step_avg:233.62ms step:6891/7050 train_time:1609898ms step_avg:233.62ms step:6892/7050 train_time:1610142ms step_avg:233.62ms step:6893/7050 train_time:1610386ms step_avg:233.63ms step:6894/7050 train_time:1610634ms step_avg:233.63ms step:6895/7050 train_time:1610891ms step_avg:233.63ms step:6896/7050 train_time:1611137ms step_avg:233.63ms step:6897/7050 train_time:1611381ms step_avg:233.64ms step:6898/7050 train_time:1611634ms step_avg:233.64ms step:6899/7050 train_time:1611888ms step_avg:233.64ms 
step:6900/7050 train_time:1612132ms step_avg:233.64ms step:6901/7050 train_time:1612376ms step_avg:233.64ms step:6902/7050 train_time:1612624ms step_avg:233.65ms step:6903/7050 train_time:1612871ms step_avg:233.65ms step:6904/7050 train_time:1613117ms step_avg:233.65ms step:6905/7050 train_time:1613360ms step_avg:233.65ms step:6906/7050 train_time:1613606ms step_avg:233.65ms step:6907/7050 train_time:1613852ms step_avg:233.65ms step:6908/7050 train_time:1614097ms step_avg:233.66ms step:6909/7050 train_time:1614353ms step_avg:233.66ms step:6910/7050 train_time:1614598ms step_avg:233.66ms step:6911/7050 train_time:1614843ms step_avg:233.66ms step:6912/7050 train_time:1615085ms step_avg:233.66ms step:6913/7050 train_time:1615329ms step_avg:233.67ms step:6914/7050 train_time:1615578ms step_avg:233.67ms step:6915/7050 train_time:1615824ms step_avg:233.67ms step:6916/7050 train_time:1616075ms step_avg:233.67ms step:6917/7050 train_time:1616320ms step_avg:233.67ms step:6918/7050 train_time:1616564ms step_avg:233.68ms step:6919/7050 train_time:1616811ms step_avg:233.68ms step:6920/7050 train_time:1617061ms step_avg:233.68ms step:6921/7050 train_time:1617305ms step_avg:233.68ms step:6922/7050 train_time:1617552ms step_avg:233.68ms step:6923/7050 train_time:1617797ms step_avg:233.68ms step:6924/7050 train_time:1618043ms step_avg:233.69ms step:6925/7050 train_time:1618285ms step_avg:233.69ms step:6926/7050 train_time:1618529ms step_avg:233.69ms step:6927/7050 train_time:1618775ms step_avg:233.69ms step:6928/7050 train_time:1619027ms step_avg:233.69ms step:6929/7050 train_time:1619269ms step_avg:233.69ms step:6930/7050 train_time:1619510ms step_avg:233.70ms step:6931/7050 train_time:1619756ms step_avg:233.70ms step:6932/7050 train_time:1620007ms step_avg:233.70ms step:6933/7050 train_time:1620256ms step_avg:233.70ms step:6934/7050 train_time:1620498ms step_avg:233.70ms step:6935/7050 train_time:1620742ms step_avg:233.70ms step:6936/7050 train_time:1620992ms step_avg:233.71ms 
step:6937/7050 train_time:1621248ms step_avg:233.71ms step:6938/7050 train_time:1621493ms step_avg:233.71ms step:6939/7050 train_time:1621737ms step_avg:233.71ms step:6940/7050 train_time:1621981ms step_avg:233.71ms step:6941/7050 train_time:1622237ms step_avg:233.72ms step:6942/7050 train_time:1622491ms step_avg:233.72ms step:6943/7050 train_time:1622734ms step_avg:233.72ms step:6944/7050 train_time:1622980ms step_avg:233.72ms step:6945/7050 train_time:1623228ms step_avg:233.73ms step:6946/7050 train_time:1623473ms step_avg:233.73ms step:6947/7050 train_time:1623721ms step_avg:233.73ms step:6948/7050 train_time:1623969ms step_avg:233.73ms step:6949/7050 train_time:1624219ms step_avg:233.73ms step:6950/7050 train_time:1624466ms step_avg:233.74ms step:6951/7050 train_time:1624709ms step_avg:233.74ms step:6952/7050 train_time:1624954ms step_avg:233.74ms step:6953/7050 train_time:1625201ms step_avg:233.74ms step:6954/7050 train_time:1625448ms step_avg:233.74ms step:6955/7050 train_time:1625690ms step_avg:233.74ms step:6956/7050 train_time:1625940ms step_avg:233.75ms step:6957/7050 train_time:1626186ms step_avg:233.75ms step:6958/7050 train_time:1626435ms step_avg:233.75ms step:6959/7050 train_time:1626679ms step_avg:233.75ms step:6960/7050 train_time:1626925ms step_avg:233.75ms step:6961/7050 train_time:1627174ms step_avg:233.76ms step:6962/7050 train_time:1627420ms step_avg:233.76ms step:6963/7050 train_time:1627669ms step_avg:233.76ms step:6964/7050 train_time:1627916ms step_avg:233.76ms step:6965/7050 train_time:1628161ms step_avg:233.76ms step:6966/7050 train_time:1628407ms step_avg:233.76ms step:6967/7050 train_time:1628653ms step_avg:233.77ms step:6968/7050 train_time:1628899ms step_avg:233.77ms step:6969/7050 train_time:1629147ms step_avg:233.77ms step:6970/7050 train_time:1629396ms step_avg:233.77ms step:6971/7050 train_time:1629645ms step_avg:233.77ms step:6972/7050 train_time:1629892ms step_avg:233.78ms step:6973/7050 train_time:1630134ms step_avg:233.78ms 
step:6974/7050 train_time:1630382ms step_avg:233.78ms step:6975/7050 train_time:1630628ms step_avg:233.78ms step:6976/7050 train_time:1630871ms step_avg:233.78ms step:6977/7050 train_time:1631114ms step_avg:233.78ms step:6978/7050 train_time:1631362ms step_avg:233.79ms step:6979/7050 train_time:1631608ms step_avg:233.79ms step:6980/7050 train_time:1631855ms step_avg:233.79ms step:6981/7050 train_time:1632098ms step_avg:233.79ms step:6982/7050 train_time:1632344ms step_avg:233.79ms step:6983/7050 train_time:1632592ms step_avg:233.80ms step:6984/7050 train_time:1632840ms step_avg:233.80ms step:6985/7050 train_time:1633083ms step_avg:233.80ms step:6986/7050 train_time:1633328ms step_avg:233.80ms step:6987/7050 train_time:1633575ms step_avg:233.80ms step:6988/7050 train_time:1633817ms step_avg:233.80ms step:6989/7050 train_time:1634065ms step_avg:233.81ms step:6990/7050 train_time:1634309ms step_avg:233.81ms step:6991/7050 train_time:1634554ms step_avg:233.81ms step:6992/7050 train_time:1634800ms step_avg:233.81ms step:6993/7050 train_time:1635048ms step_avg:233.81ms step:6994/7050 train_time:1635294ms step_avg:233.81ms step:6995/7050 train_time:1635540ms step_avg:233.82ms step:6996/7050 train_time:1635788ms step_avg:233.82ms step:6997/7050 train_time:1636033ms step_avg:233.82ms step:6998/7050 train_time:1636277ms step_avg:233.82ms step:6999/7050 train_time:1636523ms step_avg:233.82ms step:7000/7050 train_time:1636768ms step_avg:233.82ms step:7000/7050 val_loss:2.9198 train_time:1636960ms step_avg:233.85ms step:7001/7050 train_time:1637012ms step_avg:233.83ms step:7002/7050 train_time:1637263ms step_avg:233.83ms step:7003/7050 train_time:1637509ms step_avg:233.83ms step:7004/7050 train_time:1637757ms step_avg:233.83ms step:7005/7050 train_time:1638005ms step_avg:233.83ms step:7006/7050 train_time:1638250ms step_avg:233.84ms step:7007/7050 train_time:1638498ms step_avg:233.84ms step:7008/7050 train_time:1638742ms step_avg:233.84ms step:7009/7050 train_time:1638987ms 
step_avg:233.84ms step:7010/7050 train_time:1639232ms step_avg:233.84ms step:7011/7050 train_time:1639475ms step_avg:233.84ms step:7012/7050 train_time:1639725ms step_avg:233.85ms step:7013/7050 train_time:1639970ms step_avg:233.85ms step:7014/7050 train_time:1640212ms step_avg:233.85ms step:7015/7050 train_time:1640457ms step_avg:233.85ms step:7016/7050 train_time:1640703ms step_avg:233.85ms step:7017/7050 train_time:1640949ms step_avg:233.85ms step:7018/7050 train_time:1641192ms step_avg:233.85ms step:7019/7050 train_time:1641437ms step_avg:233.86ms step:7020/7050 train_time:1641682ms step_avg:233.86ms step:7021/7050 train_time:1641928ms step_avg:233.86ms step:7022/7050 train_time:1642173ms step_avg:233.86ms step:7023/7050 train_time:1642417ms step_avg:233.86ms step:7024/7050 train_time:1642665ms step_avg:233.86ms step:7025/7050 train_time:1642909ms step_avg:233.87ms step:7026/7050 train_time:1643151ms step_avg:233.87ms step:7027/7050 train_time:1643400ms step_avg:233.87ms step:7028/7050 train_time:1643642ms step_avg:233.87ms step:7029/7050 train_time:1643891ms step_avg:233.87ms step:7030/7050 train_time:1644134ms step_avg:233.87ms step:7031/7050 train_time:1644382ms step_avg:233.88ms step:7032/7050 train_time:1644626ms step_avg:233.88ms step:7033/7050 train_time:1644869ms step_avg:233.88ms step:7034/7050 train_time:1645114ms step_avg:233.88ms step:7035/7050 train_time:1645363ms step_avg:233.88ms step:7036/7050 train_time:1645608ms step_avg:233.88ms step:7037/7050 train_time:1645853ms step_avg:233.89ms step:7038/7050 train_time:1646096ms step_avg:233.89ms step:7039/7050 train_time:1646343ms step_avg:233.89ms step:7040/7050 train_time:1646589ms step_avg:233.89ms step:7041/7050 train_time:1646836ms step_avg:233.89ms step:7042/7050 train_time:1647084ms step_avg:233.89ms step:7043/7050 train_time:1647330ms step_avg:233.90ms step:7044/7050 train_time:1647575ms step_avg:233.90ms step:7045/7050 train_time:1647821ms step_avg:233.90ms step:7046/7050 train_time:1648067ms 
step_avg:233.90ms step:7047/7050 train_time:1648312ms step_avg:233.90ms step:7048/7050 train_time:1648558ms step_avg:233.90ms step:7049/7050 train_time:1648802ms step_avg:233.91ms step:7050/7050 train_time:1649047ms step_avg:233.91ms step:7050/7050 val_loss:2.9193 train_time:1649246ms step_avg:233.94ms peak memory allocated: 59737 MiB reserved: 70818 MiB